Structured Data Classification Fresco Play Hands-on Solutions

Course Path: Data Science/MACHINE LEARNING METHODS/Structured Data Classification

Welcome to Structured Data Classification (75 Min)

File Name: Structured_test

Step 1: - 

import pandas as pd

import numpy as np

import dataframe as df

Step 2:- 

# Load the weather observations into a DataFrame (comma is read_csv's default delimiter).
weather = pd.read_csv('weather.csv')

Step 3:- 



# Column labels of the loaded DataFrame, as a plain Python list.
weather_col_names = weather.columns.tolist()




Step 4:-

weather_target = weather['RainTomorrow']



Step 5:-

# Columns that are not used as model inputs.
cols_to_drop = ['Date', 'RainTomorrow']

# Feature table: every column of `weather` except the ones listed above.
weather_feature = weather.drop(columns=cols_to_drop)


Step 6: -

# Keep only the object-dtype columns of the raw table.
weather_categorical = weather.select_dtypes(include='object')


Step 7:- 

yes_no_cols = ["RainToday"]

# Turn each listed column into booleans: True where the cell equals 'Yes',
# False for every other value.
weather_feature[yes_no_cols] = weather_feature[yes_no_cols].eq('Yes')


Step 8:-

# One-hot encode the categorical columns; each new indicator column is named
# "<source column>_<category>" because the prefixes repeat the column names.
categorical_cols = ["Location", "WindGustDir", "WindDir9am", "WindDir3pm"]
weather_dumm = pd.get_dummies(
    weather_feature,
    columns=categorical_cols,
    prefix=categorical_cols,
)

# Convert the encoded table to a float matrix. The builtin `float` is used
# because the `np.float` alias was removed in NumPy 1.24 (it was only ever an
# alias for the builtin, so the resulting dtype is unchanged).
weather_matrix = weather_dumm.values.astype(float)

Step 9:- 

from sklearn.impute import SimpleImputer

# Mean imputation: every NaN is replaced by the mean of its column.
# The `verbose` argument is no longer passed because scikit-learn 1.3 removed
# it from SimpleImputer; `fill_value=None` and `copy=True` were the defaults.
imp = SimpleImputer(missing_values=np.nan, strategy='mean')

# Actually apply the imputer: without this the matrix still contains NaN
# when it reaches the classifiers.
weather_matrix = imp.fit_transform(weather_matrix)


Step 10:-

from sklearn.preprocessing import StandardScaler

# Learn the per-column mean and standard deviation of the feature matrix.
scaler = StandardScaler().fit(weather_matrix)

# Standardize: subtract the learned mean and scale each column to unit variance.
weather_matrix = scaler.transform(weather_matrix)

Step 11:- 

from sklearn.model_selection import train_test_split

# Fixed random seed so the split, and the classifiers that also take
# random_state=seed, give reproducible results.
# NOTE(review): `seed` was used but never defined in this file; 7 is a
# placeholder value - confirm against the exercise statement.
seed = 7

# Hold out 10% of the rows as the test set.
train_data, test_data, train_label, test_label = train_test_split(
    weather_matrix,
    weather_target,
    test_size=0.1,
    random_state=seed,
)

Step 12:- 

from sklearn.svm import SVC

# Linear-kernel support vector classifier; `seed` must already be defined.
classifier = SVC(kernel="linear", C=0.025, random_state=seed)

# Train on the training split (fit returns the fitted estimator itself).
classifier = classifier.fit(train_data, train_label)

# Mean accuracy on the held-out test split.
score = classifier.score(test_data, test_label)

print('SVM Classifier : ', score)

# Save the score to disk.
# NOTE(review): the body of this `with` block was missing in the original;
# writing the score as text is the presumed intent - confirm.
with open('output.txt', 'w') as file:
    file.write(str(score))


Step 13:- 

from sklearn.ensemble import RandomForestClassifier

# Small random forest: 10 trees, each at most 5 levels deep and considering
# 10 features per split; `seed` must already be defined.
classifier = RandomForestClassifier(
    max_depth=5,
    n_estimators=10,
    max_features=10,
    random_state=seed,
)

# Train on the training split (fit returns the fitted estimator itself).
classifier = classifier.fit(train_data, train_label)

# Mean accuracy on the held-out test split.
score = classifier.score(test_data, test_label)

print('Random Forest Classifier : ', score)

# Save the score to disk.
# NOTE(review): the body of this `with` block was missing in the original;
# writing the score as text is the presumed intent - confirm.
with open('output1.txt', 'w') as file:
    file.write(str(score))


