#numpy dizileri dataframe donusumu
Explore tagged Tumblr posts
warforcoding-blog · 7 years ago
Text
Veri Analizi Proje Yönetimi ve Problem Tipleri
#1. kutuphaneler import numpy as np import matplotlib.pyplot as plt import pandas as pd
#2.1. Veri Yukleme veriler = pd.read_csv('dosya_adı.csv') #pd.read_csv("veriler.csv")
#eksik veriler
from sklearn.preprocessing import Imputer
imputer= Imputer(missing_values='NaN', strategy = 'mean', axis=0 )    
Yas = veriler.iloc[:,1:4].values print(Yas) imputer = imputer.fit(Yas[:,1:4]) Yas[:,1:4] = imputer.transform(Yas[:,1:4]) print(Yas)
#encoder:  Kategorik -> Numeric ulke = veriler.iloc[:,0:1].values print(ulke) from sklearn.preprocessing import LabelEncoder le = LabelEncoder() ulke[:,0] = le.fit_transform(ulke[:,0]) print(ulke)
from sklearn.preprocessing import OneHotEncoder ohe = OneHotEncoder(categorical_features='all') ulke=ohe.fit_transform(ulke).toarray() print(ulke)
#numpy dizileri dataframe donusumu sonuc = pd.DataFrame(data = ulke, index = range(22), columns=['fr','tr','us'] ) print(sonuc)
sonuc2 =pd.DataFrame(data = Yas, index = range(22), columns = ['boy','kilo','yas']) print(sonuc2)
cinsiyet = veriler.iloc[:,-1].values print(cinsiyet)
sonuc3 = pd.DataFrame(data = cinsiyet , index=range(22), columns=['cinsiyet']) print(sonuc3)
#dataframe birlestirme islemi s=pd.concat([sonuc,sonuc2],axis=1) print(s)
s2= pd.concat([s,sonuc3],axis=1) print(s2)
#verilerin egitim ve test icin bolunmesi from sklearn.cross_validation import train_test_split x_train, x_test,y_train,y_test = train_test_split(s,sonuc3,test_size=0.33, random_state=0)
#verilerin olceklenmesi from sklearn.preprocessing import StandardScaler
sc = StandardScaler() X_train = sc.fit_transform(x_train) X_test = sc.fit_transform(x_test)
0 notes