資料集取自UCI網站,為五年內印第安人糖尿病的醫療資料。
- -----------------------------------------------採用Python標準類庫導入資料-----------------------------------------------------------
from csv import reader
import numpy as np
# Load the CSV file with the standard-library csv reader, then turn the
# parsed rows into a float NumPy array.
filename = 'pima.csv'
# newline='' lets the csv module handle line endings itself, as its
# documentation recommends for files passed to reader().
with open(filename, 'rt', newline='') as raw_data:
    readers = reader(raw_data, delimiter=',')
    # The reader is lazy, so the rows must be collected while the file is open.
    x = list(readers)
# csv.reader yields every field as a string; cast the whole table to float.
data = np.array(x).astype('float')
# Show the dimensions of the loaded array.
print(data.shape)
- -----------------------------------------------採用NumPy導入資料---------------------------------------------------------------
from numpy import loadtxt
# Load the CSV file directly into a NumPy array with numpy.loadtxt.
filename = 'pima.csv'
with open(filename, 'rt') as raw_data:
    # loadtxt consumes the open file here, so the call stays inside the
    # with-block.
    data = loadtxt(raw_data, delimiter=',')
# Show the dimensions of the loaded array.
print(data.shape)
- -----------------------------------------------採用pandas導入資料---------------------------------------------------------------
推薦使用此方式(pandas 的 read_csv)。
from pandas import read_csv
# Load the CSV file into a pandas DataFrame, supplying the column labels
# explicitly through the names list.
filename = 'pima.csv'
names = [
    'preg',
    'plas',
    'pres',
    'skin',
    'test',
    'mass',
    'pedi',
    'age',
    'class',
]
data = read_csv(filepath_or_buffer=filename, names=names)
# Show the (rows, columns) shape of the resulting DataFrame.
print(data.shape)