import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns
import xgboost as xgb
import imblearn
import os
import pickle
import shap

from pathlib import Path
from scipy import stats
from scipy.stats import norm
from sklearn.ensemble import ExtraTreesClassifier, RandomForestClassifier
from sklearn.neural_network import MLPClassifier
from sklearn.preprocessing import MinMaxScaler, StandardScaler
from sklearn.model_selection import train_test_split, RandomizedSearchCV, GridSearchCV
from sklearn.metrics import classification_report, confusion_matrix, accuracy_score, roc_curve, roc_auc_score
from collections import Counter
from imblearn.over_sampling import SMOTE

%matplotlib inline


wines = pd.read_csv('Data/winequality-white.csv', sep = ';')


wines.head()


wines.describe()


wines.dtypes

fixed acidity           float64
volatile acidity        float64
citric acid             float64
residual sugar          float64
chlorides               float64
free sulfur dioxide     float64
total sulfur dioxide    float64
density                 float64
pH                      float64
sulphates               float64
alcohol                 float64
quality                   int64
dtype: object


# Verificando se contem valor NA no dataset
wines.isna().sum()

fixed acidity           0
volatile acidity        0
citric acid             0
residual sugar          0
chlorides               0
free sulfur dioxide     0
total sulfur dioxide    0
density                 0
pH                      0
sulphates               0
alcohol                 0
quality                 0
dtype: int64


'''
    Função do repositorio: https://gist.github.com/anisayari/2d54c43044d7bb1b29c72c832a0fb1d8#file-reduce_mem_usage-py
    Auxilia na redução de memoria do dataframe, adaptando os tipos de cada variavel.
'''
def reduce_mem_usage(df):
    """ iterate through all the columns of a dataframe and modify the data type
        to reduce memory usage.
    """
    start_mem = df.memory_usage().sum() / 1024 ** 2
    print('Memory usage of dataframe is {:.2f} MB'.format(start_mem))

    for col in df.columns:
        col_type = df[col].dtype

        if col_type != object:
            c_min = df[col].min()
            c_max = df[col].max()
            if str(col_type)[:3] == 'int':
                if c_min > np.iinfo(np.int8).min and c_max < np.iinfo(np.int8).max:
                    df[col] = df[col].astype(np.int8)
                elif c_min > np.iinfo(np.int16).min and c_max < np.iinfo(np.int16).max:
                    df[col] = df[col].astype(np.int16)
                elif c_min > np.iinfo(np.int32).min and c_max < np.iinfo(np.int32).max:
                    df[col] = df[col].astype(np.int32)
                elif c_min > np.iinfo(np.int64).min and c_max < np.iinfo(np.int64).max:
                    df[col] = df[col].astype(np.int64)
            else:
                if c_min > np.finfo(np.float16).min and c_max < np.finfo(np.float16).max:
                    df[col] = df[col].astype(np.float16)
                elif c_min > np.finfo(np.float32).min and c_max < np.finfo(np.float32).max:
                    df[col] = df[col].astype(np.float32)
                else:
                    df[col] = df[col].astype(np.float64)
        else:
            df[col] = df[col].astype('category')

    end_mem = df.memory_usage().sum() / 1024 ** 2
    print('Memory usage after optimization is: {:.2f} MB'.format(end_mem))
    print('Decreased by {:.1f}%'.format(100 * (start_mem - end_mem) / start_mem))

    return df


#wines = reduce_mem_usage(wines)


# Verificando se foi alterado o valor de alguma variavel por engano
#wines.describe()


wines.corr()


plt.figure(figsize = (10, 10))
sns.heatmap(wines.corr(), annot =  True)
plt.show()


# Definindo range de X e Y
x_range = [wines['fixed acidity'].min(), wines['fixed acidity'].max()]
y_range = [wines['quality'].min(), wines['quality'].max()]

# Scatter plot de X e Y
scatter_plot = wines.plot(kind = 'scatter', x = 'fixed acidity', y = 'quality', xlim = x_range, ylim = y_range)

# Traçar linha da media de X e Y
meanY = scatter_plot.plot(x_range, [wines['quality'].mean(), wines['quality'].mean()], '--', color = 'red', linewidth = 1)
meanX = scatter_plot.plot([wines['fixed acidity'].mean(), wines['fixed acidity'].mean()], y_range, '--', color = 'red', linewidth = 1)


def scatter_plot_conjunto(data, columns, target):
    # Definindo range de Y
    y_range = [data[target].min(), data[target].max()]
    
    for column in columns:
        if target != column:
            # Definindo range de X
            x_range = [data[column].min(), data[column].max()]
            
            # Scatter plot de X e Y
            scatter_plot = data.plot(kind = 'scatter', x = column, y = target, xlim = x_range, ylim = y_range)
            
            # Traçar linha da media de X e Y
            meanX = scatter_plot.plot(x_range, [data[target].mean(), data[target].mean()], '--', color = 'red', linewidth = 1)
            meanY = scatter_plot.plot([data[column].mean(), data[column].mean()], y_range, '--', color = 'red', linewidth = 1)


columns = wines.keys()
scatter_plot_conjunto(wines, columns, 'quality')


X = wines.iloc[:, :-1]
y = wines['quality'].values

corr = np.corrcoef(X, rowvar = 0)
eigenvalues, eigenvectors = np.linalg.eig(corr)


print(eigenvalues)

[3.22225389 0.02064909 1.57523993 0.28948714 0.41414367 1.22167134
 0.59935848 0.72659802 0.93874151 0.97333458 1.01852235]


print(eigenvectors[:, 1])

[-0.17129048 -0.01705666 -0.00972112 -0.49022593 -0.02539945  0.03090844
 -0.03556095  0.75977937 -0.1411972  -0.04183284  0.35796133]


print(columns[3], columns[7], columns[10])

residual sugar density alcohol


print(columns[0], columns[3], columns[7], columns[8], columns[10])

fixed acidity residual sugar density pH alcohol


scatter_plot_conjunto(wines, ['residual sugar', 'alcohol'], 'density')


scatter_plot_conjunto(wines, ['fixed acidity'], 'pH')


def boxplot_plot_conjunto(data, columns, target):
    for column in columns:
        if column != target:
            sns.boxplot(x = target, y = column, data = data)


boxplot_plot_conjunto(wines, columns, 'quality')


print(columns)

Index(['fixed acidity', 'volatile acidity', 'citric acid', 'residual sugar',
       'chlorides', 'free sulfur dioxide', 'total sulfur dioxide', 'density',
       'pH', 'sulphates', 'alcohol', 'quality'],
      dtype='object')


print(wines[columns].skew())

fixed acidity           0.647751
volatile acidity        1.576980
citric acid             1.281920
residual sugar          1.077094
chlorides               5.023331
free sulfur dioxide     1.406745
total sulfur dioxide    0.390710
density                 0.977773
pH                      0.457783
sulphates               0.977194
alcohol                 0.487342
quality                 0.155796
dtype: float64


print(wines[columns].kurtosis())

fixed acidity            2.172178
volatile acidity         5.091626
citric acid              6.174901
residual sugar           3.469820
chlorides               37.564600
free sulfur dioxide     11.466342
total sulfur dioxide     0.571853
density                  9.793807
pH                       0.530775
sulphates                1.590930
alcohol                 -0.698425
quality                  0.216526
dtype: float64


def boxplot_individuais(data, columns):
    for column in columns:
        sns.boxplot(x = data[column])
        plt.show()


boxplot_individuais(wines, columns)


def hist_individual(data, columns):
    for column in columns:
        data[column].hist(label = column)
        plt.title(column)
        plt.show()


hist_individual(wines, columns)


# Criando variavel com todas colunas possuem outlier
outlier_columns = columns.copy().to_list()
outlier_columns.remove('alcohol')
print(outlier_columns)

['fixed acidity', 'volatile acidity', 'citric acid', 'residual sugar', 'chlorides', 'free sulfur dioxide', 'total sulfur dioxide', 'density', 'pH', 'sulphates', 'quality']


def outlier_percentil_based(data, columns):
    for column in columns:
        # Capturando percentile de 10 e 90
        percentil10 = data[column].quantile(0.10)
        percentil90 = data[column].quantile(0.90)
        
        data[column] = np.where(data[column] < percentil10, percentil10, data[column])
        data[column] = np.where(data[column] > percentil90, percentil90, data[column])
        
    return data


def outlier_log_transformation_based(data, columns):
    for column in columns:
        data[column] = data[column].map(lambda x: np.log(x) if x > 0 else 0)
    return data


def outlier_median_based(data, columns, bottom = False):
    for column in columns:
        percentil50 = data[column].quantile(0.50)
        percentil95 = data[column].quantile(0.95)
        percentil05 = data[column].quantile(0.05)
        
        data[column] = np.where(data[column]  > percentil95, percentil50, data[column])
        
        if bottom:
            data[column] = np.where(data[column]  < percentil05, percentil50, data[column])
        
    return data


wines = outlier_median_based(wines, outlier_columns, bottom =  True)


print(wines.skew())

fixed acidity           0.251616
volatile acidity        0.557183
citric acid             0.592357
residual sugar          0.647903
chlorides               0.283003
free sulfur dioxide     0.260288
total sulfur dioxide    0.270364
density                 0.256463
pH                      0.239489
sulphates               0.537369
alcohol                 0.487342
quality                 0.150855
dtype: float64


print(wines.kurtosis())

fixed acidity          -0.366659
volatile acidity       -0.084250
citric acid             0.007458
residual sugar         -0.682921
chlorides              -0.280081
free sulfur dioxide    -0.587664
total sulfur dioxide   -0.630729
density                -0.778132
pH                     -0.416221
sulphates              -0.158999
alcohol                -0.698425
quality                -0.852576
dtype: float64


boxplot_individuais(wines, columns)


hist_individual(wines, columns)


modelo = xgb.XGBClassifier(n_estimators = 1000)


X = wines.iloc[:, :-1]
y = wines['quality'].values

modelo.fit(X, y)

The use of label encoder in XGBClassifier is deprecated and will be removed in a future release. To remove this warning, do the following: 1) Pass option use_label_encoder=False when constructing XGBClassifier object; and 2) Encode your labels (y) as integers starting with 0, i.e. 0, 1, 2, ..., [num_class - 1].

[18:07:33] WARNING: C:/Users/Administrator/workspace/xgboost-win64_release_1.4.0/src/learner.cc:1095: Starting in XGBoost 1.3.0, the default evaluation metric used with the objective 'multi:softprob' was changed from 'merror' to 'mlogloss'. Explicitly set eval_metric if you'd like to restore the old behavior.

XGBClassifier(base_score=0.5, booster='gbtree', colsample_bylevel=1,
              colsample_bynode=1, colsample_bytree=1, gamma=0, gpu_id=-1,
              importance_type='gain', interaction_constraints='',
              learning_rate=0.300000012, max_delta_step=0, max_depth=6,
              min_child_weight=1, missing=nan, monotone_constraints='()',
              n_estimators=1000, n_jobs=24, num_parallel_tree=1,
              objective='multi:softprob', random_state=0, reg_alpha=0,
              reg_lambda=1, scale_pos_weight=None, subsample=1,
              tree_method='exact', validate_parameters=1, verbosity=None)


print(modelo.feature_importances_)

[0.07764331 0.1092582  0.0794206  0.07777265 0.07772369 0.08010259
 0.07427387 0.0755174  0.07766463 0.07655106 0.19407198]


index_ordenado = modelo.feature_importances_.argsort()


plt.barh(wines.drop('quality', axis = 1).columns[index_ordenado], modelo.feature_importances_[index_ordenado])

<BarContainer object of 11 artists>


# Variaveis selecionas antes da padronização
wines = wines[['chlorides', 'residual sugar', 'citric acid', 'free sulfur dioxide', 'volatile acidity', 'alcohol', 'quality']]

# Variaveis selecionadas após a padronização
#wines = wines[['pH', 'chlorides', 'fixed acidity', 'citric acid', 'volatile acidity', 'alcohol', 'quality']]

wines.head()


# Variaveis selecionanas apartir da analise humana
'''
# Removendo colunas 'residual sugar', 'pH' e 'alcohol' para evitar multicolinearidade
wines = wines.drop(['residual sugar', 'pH'], axis = 1)

# Removendo colunas que não possuem alta correlação com a variavel target 'quality'
wines = wines.drop(['citric acid', 'free sulfur dioxide'], axis = 1)
'''

"\n# Removendo colunas 'residual sugar', 'pH' e 'alcohol' para evitar multicolinearidade\nwines = wines.drop(['residual sugar', 'pH'], axis = 1)\n\n# Removendo colunas que não possuem alta correlação com a variavel target 'quality'\nwines = wines.drop(['citric acid', 'free sulfur dioxide'], axis = 1)\n"


X = wines.iloc[:, :-1]
y = wines['quality'].values


X.head()


print(y)

[6. 6. 6. ... 6. 7. 6.]


# Normalização
# scaler = MinMaxScaler()
# X_scaled = scaler.fit_transform(X)

# Padronização
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)


print(X_scaled)

[[ 0.22249857 -0.17103245  0.4192587   0.84562416  0.01863979 -1.39315246]
 [ 0.69927775 -1.03862093  0.16155284 -1.64831341  0.4520149  -0.82427568]
 [ 0.81847254  0.23866211  0.93467042 -0.36111982  0.16309816 -0.33666701]
 ...
 [-0.25428061 -1.13501965 -1.77124108 -0.36111982 -0.41473532 -0.90554379]
 [-0.01589102 -1.15911933 -0.35385887 -1.16561581  0.30755653  1.85757201]
 [-0.01589102 -0.17103245  0.67696456 -1.00471661 -0.84811044  1.04489089]]


plt.hist(X_scaled[:,0:1])

(array([ 439.,  396.,  814., 1123.,  723.,  592.,  394.,  245.,  113.,
          59.]),
 array([-1.92300773, -1.44622855, -0.96944937, -0.4926702 , -0.01589102,
         0.46088816,  0.93766734,  1.41444652,  1.8912257 ,  2.36800487,
         2.84478405]),
 <BarContainer object of 10 artists>)


y_list = []


# Valores acima de 6.5 serão classificados como Bom, ou seja 1. Valores abaixo de 6.5 serão Ruim, ou seja 0.

for i in range(0, len(y)):
    if y[i] >= 6.5:
        y_list.append(1) # Good
    else:
        y_list.append(0) # Bad


print(y_list)

[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 0, 0, 0, 1, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 1, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 1, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 1, 1, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 0, 1, 0, 0, 1, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 1, 1, 1, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 0, 0, 1, 0, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 1, 1, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 1, 1, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0]


print(Counter(y))

Counter({6.0: 2561, 5.0: 1457, 7.0: 880})


plt.bar(['Bad', 'Good'], [y_list.count(0), y_list.count(1)])
plt.show()


y = np.array(y_list)


print(y)

[0 0 0 ... 0 1 0]


x_train, x_test, y_train, y_test = train_test_split(X_scaled, y, test_size = .3)


count_class_0 = Counter(y_train)[0]
count_class_1 = Counter(y_train)[1]


print(count_class_0, count_class_1)


dt_final = pd.DataFrame(x_train)
dt_final['quality'] = y_train
dt_final.head()


dt_final.shape


dt_class_0 = dt_final[dt_final['quality'] == 0]
dt_class_1 = dt_final[dt_final['quality'] == 1]


dt_class_1_over = dt_class_1.sample(count_class_0, replace = True)


print(dt_class_0.shape, dt_class_1_over.shape)


dt_class_0 = dt_class_0.reset_index(drop = True)
dt_class_1_over = dt_class_1_over.reset_index(drop = True)


dt_final = pd.concat([dt_class_0, dt_class_1_over], axis = 0)


dt_final.shape


dt_final.head()


x_train = dt_final.iloc[:, :-1]
y_train = dt_final['quality'].values


#x_train, x_test, y_train, y_test = train_test_split(X_scaled, y, test_size = .3, stratify = y)
x_train, x_test, y_train, y_test = train_test_split(X_scaled, y, test_size = .1)


print(Counter(y_train))
print(x_train.shape)

Counter({0: 3624, 1: 784})
(4408, 6)


oversample = SMOTE()
x_train, y_train = oversample.fit_resample(x_train, y_train)


print(Counter(y_train))
print(x_train.shape)

Counter({0: 3624, 1: 3624})
(7248, 6)


plt.bar(['Bad', 'Good'], [list(y_train).count(0), list(y_train).count(1)])
plt.show()


print(len(x_train), len(x_test))

7248 490


def report_modelo(modelo, y, pred, label = 'Modelo', save = False):
    target_names = ['Bad',  'Good']
    
    # Forçando predições para um numero inteiro, visto que não faz sentido manter a probabilidade
    pred[pred >  0.5] = 1
    pred[pred <=  0.5] = 0
    
    # Plotando a matriz de confusão
    cm = confusion_matrix(y, pred)
    cm = pd.DataFrame(cm, index = target_names, columns= target_names)

    plt.figure(figsize = (10, 10))
    sns.heatmap(cm, cmap = "Blues", linecolor = 'black', linewidths = 1, annot = True, \
                fmt = '', xticklabels = target_names, yticklabels = target_names)
    plt.show()
    
    print('AUC: %f' % roc_auc_score(y_true = y, y_score = pred))
    
    # Area sob  a curva ROC
    rfp, rvp, lim = roc_curve(y_true = y, y_score = pred)

    plt.plot(rfp, rvp, marker = '.',  label = label,  color = 'orange')
    plt.plot([0, 1],  [0, 1], color = 'darkblue', linestyle = '--')
    plt.xlabel('Especificade')
    plt.ylabel('Sensibilidade')
    plt.legend()
    plt.show()
    
    print("Acurácia: %f" % accuracy_score(y_true = y, y_pred = pred))
    
    print(classification_report(y_true = y, y_pred = pred, target_names= target_names))
    
    if save:
        shortFileName = '000'
        fileName = 'models/0001.model'
        fileObj = Path(fileName)
        
        index = 1
        while fileObj.exists():
            index += 1
            fileName = 'models/' + shortFileName + str(index) + '.model'
            fileObj = Path(fileName)
        
        # salvar modelo
        pickle.dump(modelo, open(fileName, 'wb'))
        
        return fileName


###### CRIANDO VERSÃO 01 DO MODELO
modelo_v1 = MLPClassifier(max_iter = 1000, verbose = False)
modelo_v1.fit(x_train, y_train)
preds = modelo_v1.predict(x_test)


report_modelo(modelo_v1, y_test, preds, 'Redes Neurais')

AUC: 0.675920

Acurácia: 0.744898
              precision    recall  f1-score   support

         Bad       0.88      0.79      0.83       394
        Good       0.39      0.56      0.46        96

    accuracy                           0.74       490
   macro avg       0.64      0.68      0.65       490
weighted avg       0.79      0.74      0.76       490


###### CRIANDO VERSÃO 02 DO MODELO
# Definindo parametros e configurações

'''
params = {
        'hidden_layer_sizes': [[100, 100], [100, 100, 100], [100, 100, 100, 100]],
        'activation': ['logistic', 'tanh', 'relu'],
        'solver': ['lbfgs', 'sgd', 'adam'],
        'alpha': [0.00001, 0.0001, 0.001, 0.01, 0.1],
        'learning_rate_init': [0.0001, 0.001, 0.01, 0.1],
        'max_iter': [500, 1000, 2000],
        'momentum': [1.0, 0.9, 0.8],
        'tol': [0.00001],
        'verbose': [False],
        'early_stopping': [True, False],
        'random_state': [102]
        }'''

params = {
        'hidden_layer_sizes': [[100, 100], [100, 100, 100]],
        'activation': ['logistic', 'tanh', 'relu'],
        'solver': ['adam'],
        'alpha': [0.00001, 0.0001, 0.001],
        'learning_rate_init': [0.0001, 0.001, 0.01],
        'max_iter': [1000],
        'momentum': [1.0, 0.9, 0.8],
        'tol': [0.00001],
        'verbose': [False],
        'early_stopping': [True, False],
        'random_state': [102]
        }

#  Parametros de teste
'''
params = {
        'momentum': [1.0, 0.9, 0.8],    
        'tol': [0.00001],
        'max_iter': [1000],
        'verbose': [True],
        'early_stopping': [False],
        'hidden_layer_sizes': [[100, 100]],
        'random_state': [102]
        }'''

grid = GridSearchCV(MLPClassifier(), params, n_jobs = 20)

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_


report_modelo(modelo, y_test, preds, 'Redes Neurais')

print(grid.best_params_)

# salvar modelo
pickle.dump(modelo, open('models/000x.model', 'wb'))


# carregar modelo
modelo_carregado = pickle.load(open('models/000x.model', 'rb'))
preds = modelo_carregado.predict(x_test)

fileName = report_modelo(modelo_carregado, y_test, preds, 'Redes Neurais', True)
print(fileName)


###### CRIANDO VERSÃO 2.1 DO MODELO
# Definindo parametros e configurações

params = {
        'hidden_layer_sizes': [[100, 100], [100, 100, 100], [100, 100, 100, 100]],
        'activation': ['logistic', 'tanh', 'relu'],
        'solver': ['adam'],
        'alpha': [0.0001, 0.001, 0.01],
        'learning_rate_init': [0.0001, 0.001, 0.01],
        'max_iter': [2000],
        'momentum': [1.0, 0.9],
        'tol': [0.00001],
        'verbose': [False],
        'early_stopping': [False],
        'random_state': [102]
        }

grid = GridSearchCV(MLPClassifier(), params, n_jobs = 20)

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)


###### CRIANDO VERSÃO 03 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-06, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.01, max_iter = 1000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-05, verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.696172

Acurácia: 0.840816
              precision    recall  f1-score   support

         Bad       0.88      0.93      0.90       394
        Good       0.63      0.46      0.53        96

    accuracy                           0.84       490
   macro avg       0.75      0.70      0.72       490
weighted avg       0.83      0.84      0.83       490

'models/0001.model'


###### CRIANDO VERSÃO 04 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.01, max_iter = 1000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-05, verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.731625

Acurácia: 0.840816
              precision    recall  f1-score   support

         Bad       0.89      0.91      0.90       394
        Good       0.60      0.55      0.58        96

    accuracy                           0.84       490
   macro avg       0.75      0.73      0.74       490
weighted avg       0.84      0.84      0.84       490

'models/0002.model'


###### CRIANDO VERSÃO 05 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.0035, max_iter = 1000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-10, verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.717269

Acurácia: 0.836735
              precision    recall  f1-score   support

         Bad       0.89      0.91      0.90       394
        Good       0.60      0.52      0.56        96

    accuracy                           0.84       490
   macro avg       0.74      0.72      0.73       490
weighted avg       0.83      0.84      0.83       490

'models/0003.model'


###### CRIANDO VERSÃO 06 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.0050, max_iter = 1000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-10, verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.714996

Acurácia: 0.820408
              precision    recall  f1-score   support

         Bad       0.89      0.89      0.89       394
        Good       0.54      0.54      0.54        96

    accuracy                           0.82       490
   macro avg       0.71      0.71      0.71       490
weighted avg       0.82      0.82      0.82       490

'models/0004.model'


shap.initjs()

explainer = shap.KernelExplainer(modelo.predict_proba, x_train)
shap_values = explainer.shap_values(x_test[0:100,:])

Using 7248 background data samples could cause slower run times. Consider using shap.sample(data, K) or shap.kmeans(data, K) to summarize the background as K samples.


column_names = ['chlorides', 'residual sugar', 'citric acid', 'free sulfur dioxide', 'volatile acidity', 'alcohol']


shap.force_plot(explainer.expected_value[1], shap_values[1][0,:], x_test[0,], feature_names = column_names)


shap.force_plot(explainer.expected_value[0], shap_values[0], x_test[0:100,:], feature_names = column_names)


shap.summary_plot(shap_values[0], x_test[0:100,:], feature_names = column_names)


###### CRIANDO VERSÃO 07 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.0025, max_iter = 2000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-10, verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.722742

Acurácia: 0.826531
              precision    recall  f1-score   support

         Bad       0.89      0.89      0.89       394
        Good       0.56      0.55      0.55        96

    accuracy                           0.83       490
   macro avg       0.72      0.72      0.72       490
weighted avg       0.83      0.83      0.83       490

'models/0005.model'


###### CRIANDO VERSÃO 08 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.0025, max_iter = 5000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-10, n_iter_no_change = 100, \
                       verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.720204

Acurácia: 0.822449
              precision    recall  f1-score   support

         Bad       0.89      0.89      0.89       394
        Good       0.55      0.55      0.55        96

    accuracy                           0.82       490
   macro avg       0.72      0.72      0.72       490
weighted avg       0.82      0.82      0.82       490

'models/0006.model'


###### CRIANDO VERSÃO 09 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.0025, max_iter = 5000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-10, n_iter_no_change = 100, \
                       verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.720204

Acurácia: 0.822449
              precision    recall  f1-score   support

         Bad       0.89      0.89      0.89       394
        Good       0.55      0.55      0.55        96

    accuracy                           0.82       490
   macro avg       0.72      0.72      0.72       490
weighted avg       0.82      0.82      0.82       490

'models/0007.model'


###### CRIANDO VERSÃO 10 DO MODELO

modelo = MLPClassifier(activation = 'logistic', alpha = 1e-07, early_stopping = False,\
                       hidden_layer_sizes = [100, 100], learning_rate_init = 0.001, max_iter = 5000,\
                       momentum = 1.0, random_state = 102, solver = 'adam', tol = 1e-20, n_iter_no_change = 250, \
                       verbose = False)
modelo.fit(x_train, y_train)
preds = modelo.predict(x_test)

Stochastic Optimizer: Maximum iterations (5000) reached and the optimization hasn't converged yet.


report_modelo(modelo, y_test, preds, 'Redes Neurais', True)

AUC: 0.762743

Acurácia: 0.859184
              precision    recall  f1-score   support

         Bad       0.91      0.92      0.91       394
        Good       0.65      0.60      0.63        96

    accuracy                           0.86       490
   macro avg       0.78      0.76      0.77       490
weighted avg       0.86      0.86      0.86       490

'models/0008.model'


shap.initjs()

explainer = shap.KernelExplainer(modelo.predict_proba, x_train)
shap_values = explainer.shap_values(x_test[0:100,:])

Using 7248 background data samples could cause slower run times. Consider using shap.sample(data, K) or shap.kmeans(data, K) to summarize the background as K samples.


column_names = ['chlorides', 'residual sugar', 'citric acid', 'free sulfur dioxide', 'volatile acidity', 'alcohol']


shap.force_plot(explainer.expected_value[1], shap_values[1][0,:], x_test[0,], feature_names = column_names)


shap.force_plot(explainer.expected_value[0], shap_values[0], x_test[0:100,:], feature_names = column_names)


shap.summary_plot(shap_values[0], x_test[0:100,:], feature_names = column_names)


# Transformando os dados em DMatrix pois o XGBoost exige
dtrain = xgb.DMatrix(x_train, label = y_train)
dtest = xgb.DMatrix(x_test, label = y_test)


# Definindo parametros e configurações
param = {}
num_round = 2


# Treinando versão 1
modelo_v1 = xgb.train(params = param, dtrain = dtrain)


# Realizando previsões
preds = modelo_v1.predict(dtest)


report_modelo(modelo_v1, y_test, preds)

AUC: 0.704235

Acurácia: 0.771429
              precision    recall  f1-score   support

         Bad       0.89      0.81      0.85       394
        Good       0.44      0.59      0.50        96

    accuracy                           0.77       490
   macro avg       0.67      0.70      0.68       490
weighted avg       0.80      0.77      0.78       490


# Definindo parametros e configurações
param = {'nthread':  20}
num_round = 100


# Treinando versão 2
modelo_v2 = xgb.train(params = param, dtrain = dtrain, num_boost_round = num_round)


# Realizando previsões
preds = modelo_v2.predict(dtest)


report_modelo(modelo_v2, y_test, preds)

AUC: 0.696172

Acurácia: 0.840816
              precision    recall  f1-score   support

         Bad       0.88      0.93      0.90       394
        Good       0.63      0.46      0.53        96

    accuracy                           0.84       490
   macro avg       0.75      0.70      0.72       490
weighted avg       0.83      0.84      0.83       490


print(y_train)

[0 0 0 ... 1 1 1]


# Definindo parametros e configurações

param = {
        'min_child_weight': [1, 5, 10],
        'gamma': [0.5, 1, 1.5, 2, 5],
        'subsample': [0.6, 0.8, 1.0],
        'colsample_bytree': [0.6, 0.8, 1.0],
        'max_depth': [3, 4, 5],
        'learning_rate': [0.3, 0.2, 0.1, 0.05],
        'nthread': [2],
        'num_round': [100]
        }

'''
param = {
        'nthread': [1],
        'num_round': [3]
        }
'''

num_round = 100

# Treinando versão 3
modelo = xgb.XGBClassifier(use_label_encoder = False)

grid = GridSearchCV(modelo, param_grid = param,  n_jobs = 20, scoring='roc_auc')

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_

report_modelo(modelo, y_test, preds)

print(grid.best_params_)

modelo.save_model('models/0002.model')


modelo = xgb.Booster({'nthread': 4})  # init model
modelo.load_model('models/0001.model')  # load data


preds = modelo.predict(dtest)

print(preds)

report_modelo(modelo, y_test, preds)


# Definindo parametros e configurações

param = {
        'min_child_weight': [1, 5, 10],
        'gamma': [0.5, 1, 1.5, 2, 5],
        'subsample': [0.6, 0.8, 1.0, 1.2, 1.4],
        'colsample_bytree': [0.8, 1.0, 1.2, 1.4],
        'max_depth': [4, 5, 6, 7],
        'learning_rate': [0.4, 0.3, 0.2, 0.1],
        'nthread': [2],
        'num_round': [100]
        }

'''
param = {
        'nthread': [1],
        'num_round': [3]
        }
'''

num_round = 100

# Treinando versão 4
modelo = xgb.XGBClassifier(use_label_encoder = False)

grid = GridSearchCV(modelo, param_grid = param,  n_jobs = 20, scoring='roc_auc')

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_

report_modelo(modelo, y_test, preds)

print(grid.best_params_)

modelo.save_model('models/0003.model')


# Definindo parametros e configurações

param = {
        'min_child_weight': [1, 5, 10],
        'gamma': [0.125, 0.25, 0.5, 1, 1.5, 2],
        'subsample': [0.6, 0.8, 1.0, 1.2],
        'colsample_bytree': [0.4, 0.6, 0.8, 1.0],
        'max_depth': [5, 6, 7, 8, 9],
        'learning_rate': [0.4, 0.3, 0.2, 0.1],
        'nthread': [2],
        'num_round': [100]
        }

# Treinando versão 5
modelo = xgb.XGBClassifier(use_label_encoder = False)

grid = GridSearchCV(modelo, param_grid = param,  n_jobs = 20, scoring='roc_auc')

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_

report_modelo(modelo, y_test, preds)

print(grid.best_params_)

modelo.save_model('models/0004.model')


# Definindo parametros e configurações
param = {
        'min_child_weight': [1, 5, 10],
        'gamma': [0.125, 0.25, 0.5, 1, 1.5, 2],
        'subsample': [0.6, 0.8, 1.0, 1.2],
        'colsample_bytree': [0.4, 0.6, 0.8, 1.0, 1.1],
        'max_depth': [6, 7, 8, 9, 10, 11],
        'learning_rate': [0.4, 0.3, 0.2, 0.1],
        'nthread': [2],
        'num_round': [100]
        }

# Treinando versão 5
modelo = xgb.XGBClassifier(use_label_encoder = False)

grid = GridSearchCV(modelo, param_grid = param,  n_jobs = 20, scoring='roc_auc')

grid.fit(x_train, y_train)

preds = grid.predict_proba(x_test)[:,1]

modelo = grid.best_estimator_

report_modelo(modelo, y_test, preds)

print(grid.best_params_)

modelo.save_model('models/0005.model')

	fixed acidity	volatile acidity	citric acid	residual sugar	chlorides	free sulfur dioxide	total sulfur dioxide	density	pH	sulphates	alcohol	quality
0	7.0	0.27	0.36	20.7	0.045	45.0	170.0	1.0010	3.00	0.45	8.8	6
1	6.3	0.30	0.34	1.6	0.049	14.0	132.0	0.9940	3.30	0.49	9.5	6
2	8.1	0.28	0.40	6.9	0.050	30.0	97.0	0.9951	3.26	0.44	10.1	6
3	7.2	0.23	0.32	8.5	0.058	47.0	186.0	0.9956	3.19	0.40	9.9	6
4	7.2	0.23	0.32	8.5	0.058	47.0	186.0	0.9956	3.19	0.40	9.9	6

	fixed acidity	volatile acidity	citric acid	residual sugar	chlorides	free sulfur dioxide	total sulfur dioxide	density	pH	sulphates	alcohol	quality
count	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000	4898.000000
mean	6.854788	0.278241	0.334192	6.391415	0.045772	35.308085	138.360657	0.994027	3.188267	0.489847	10.514267	5.877909
std	0.843868	0.100795	0.121020	5.072058	0.021848	17.007137	42.498065	0.002991	0.151001	0.114126	1.230621	0.885639
min	3.800000	0.080000	0.000000	0.600000	0.009000	2.000000	9.000000	0.987110	2.720000	0.220000	8.000000	3.000000
25%	6.300000	0.210000	0.270000	1.700000	0.036000	23.000000	108.000000	0.991723	3.090000	0.410000	9.500000	5.000000
50%	6.800000	0.260000	0.320000	5.200000	0.043000	34.000000	134.000000	0.993740	3.180000	0.470000	10.400000	6.000000
75%	7.300000	0.320000	0.390000	9.900000	0.050000	46.000000	167.000000	0.996100	3.280000	0.550000	11.400000	6.000000
max	14.200000	1.100000	1.660000	65.800000	0.346000	289.000000	440.000000	1.038980	3.820000	1.080000	14.200000	9.000000

	fixed acidity	volatile acidity	citric acid	residual sugar	chlorides	free sulfur dioxide	total sulfur dioxide	density	pH	sulphates	alcohol	quality
fixed acidity	1.000000	-0.022697	0.289181	0.089021	0.023086	-0.049396	0.091070	0.265331	-0.425858	-0.017143	-0.120881	-0.113663
volatile acidity	-0.022697	1.000000	-0.149472	0.064286	0.070512	-0.097012	0.089261	0.027114	-0.031915	-0.035728	0.067718	-0.194723
citric acid	0.289181	-0.149472	1.000000	0.094212	0.114364	0.094077	0.121131	0.149503	-0.163748	0.062331	-0.075729	-0.009209
residual sugar	0.089021	0.064286	0.094212	1.000000	0.088685	0.299098	0.401439	0.838966	-0.194133	-0.026664	-0.450631	-0.097577
chlorides	0.023086	0.070512	0.114364	0.088685	1.000000	0.101392	0.198910	0.257211	-0.090439	0.016763	-0.360189	-0.209934
free sulfur dioxide	-0.049396	-0.097012	0.094077	0.299098	0.101392	1.000000	0.615501	0.294210	-0.000618	0.059217	-0.250104	0.008158
total sulfur dioxide	0.091070	0.089261	0.121131	0.401439	0.198910	0.615501	1.000000	0.529881	0.002321	0.134562	-0.448892	-0.174737
density	0.265331	0.027114	0.149503	0.838966	0.257211	0.294210	0.529881	1.000000	-0.093591	0.074493	-0.780138	-0.307123
pH	-0.425858	-0.031915	-0.163748	-0.194133	-0.090439	-0.000618	0.002321	-0.093591	1.000000	0.155951	0.121432	0.099427
sulphates	-0.017143	-0.035728	0.062331	-0.026664	0.016763	0.059217	0.134562	0.074493	0.155951	1.000000	-0.017433	0.053678
alcohol	-0.120881	0.067718	-0.075729	-0.450631	-0.360189	-0.250104	-0.448892	-0.780138	0.121432	-0.017433	1.000000	0.435575
quality	-0.113663	-0.194723	-0.009209	-0.097577	-0.209934	0.008158	-0.174737	-0.307123	0.099427	0.053678	0.435575	1.000000

	chlorides	residual sugar	citric acid	free sulfur dioxide	volatile acidity	alcohol	quality
0	0.045	5.2	0.36	45.0	0.27	8.8	6.0
1	0.049	1.6	0.34	14.0	0.30	9.5	6.0
2	0.050	6.9	0.40	30.0	0.28	10.1	6.0
3	0.058	8.5	0.32	47.0	0.23	9.9	6.0
4	0.058	8.5	0.32	47.0	0.23	9.9	6.0

	chlorides	residual sugar	citric acid	free sulfur dioxide	volatile acidity	alcohol
0	0.045	5.2	0.36	45.0	0.27	8.8
1	0.049	1.6	0.34	14.0	0.30	9.5
2	0.050	6.9	0.40	30.0	0.28	10.1
3	0.058	8.5	0.32	47.0	0.23	9.9
4	0.058	8.5	0.32	47.0	0.23	9.9

Definindo o problema de negócio¶

Variáveis da base¶

Imports¶

Analise Exploratoria¶

Analise Exploratoria - Sem Processamento¶

Avaliando MultiColinearidade¶

Pre-Processamento¶

Detectando e Removendo Outliers¶

Feature Selecting¶

Normalizando/Padronização¶

Transformando os Dados¶

BALANCEANDO OS DADOS¶

OVERSAMPLING BASICO¶

SMOTE¶

Treinando Modelos¶

Redes Neurais - MLPClassifier¶

XGBOOST¶