import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns
# Load the training set into a DataFrame.
# NOTE(review): absolute path on one developer's machine — adjust before
# running anywhere else.
TRAIN_CSV_PATH = "C:/Users/lucy8/PycharmProjects/test2/DSOB/train.csv"
df = pd.read_csv(TRAIN_CSV_PATH)

# First three rows, to see what the columns and values look like
# (listing line 6).
print(df.head(3))
# (rows, columns) of the table (listing line 7).
print(df.shape)
# Count of missing values per column (listing line 8).
print(df.isnull().sum())
# Column dtypes and non-null counts (listing line 9). info() writes its
# report itself and returns None, so wrapping it in print() only added a
# stray "None" line.
df.info()
df ํ์ผ์ ํ ๋น๋ ๋ฐ์ดํฐ ์ค์ 3๊ฐ๋ฅผ ๋ฝ์, ๋ฐ์ดํฐ์ ํํ ๋ฑ์ ํ์ ํจ
์ข(7ํ,8ํ)๋ ๋ฐ์ดํฐ์ ๊ฐ์๋ฅผ ํ๋ ฌ๋ก ์๋ ค์ฃผ๊ณ , null๊ฐ์ด ์๋์ง ์๋ ค์ค (null๊ฐ์ด ์๋ค๋ฉด, ํด๊ฒฐํด์ผํจ (ํ๊ท ,์ญ์ ๋ฑ))
์ฐ(9ํ)๋ ๋ฐ์ดํฐ ํ์ ์ ์๋ ค์ค
# Distinct values of the 'type' column and how many there are.
num_type = df['type'].unique()
print(num_type)
print(len(num_type))

# Distinct values of the 'fiberID' column and how many there are.
fiberid_type = df['fiberID'].unique()
print(fiberid_type)
print(len(fiberid_type))

# Magnitude columns used for the correlation matrix and the histograms.
numerical_columns = [
    'psfMag_u', 'psfMag_g', 'psfMag_r', 'psfMag_i', 'psfMag_z',
    'fiberMag_u', 'fiberMag_g', 'fiberMag_r', 'fiberMag_i', 'fiberMag_z',
    'petroMag_u', 'petroMag_g', 'petroMag_r', 'petroMag_i', 'petroMag_z',
    'modelMag_u', 'modelMag_g',
]

# Pairwise Pearson correlation between the selected columns.
corr = df[numerical_columns].corr(method='pearson')
print(corr)

# Annotated heatmap of the correlation matrix.
fig = plt.figure(figsize=(12, 8))
ax = fig.gca()
sns.set(font_scale=1.5)  # font size used inside the heatmap
sns.heatmap(
    corr.values,
    annot=True,
    fmt='.2f',
    annot_kws={'size': 15},
    yticklabels=numerical_columns,
    xticklabels=numerical_columns,
    ax=ax,
    cmap="RdYlBu",
)
plt.tight_layout()
# The original had `plt.show` without parentheses, which is a no-op: the
# heatmap was never displayed here and the box plots below were drawn onto
# the same figure.
plt.show()

# Box plots of two columns, side by side on a fresh figure. The original
# issued two separate plt.boxplot() calls, which both draw at x-position 1
# of the same axes and overlap each other.
boxplot_columns = ['fiberMag_u', 'petroMag_u']
fig, ax = plt.subplots()
# dropna(): a NaN in the input would make that column's box statistics NaN.
ax.boxplot([df[column].dropna() for column in boxplot_columns])
ax.set_xticklabels(boxplot_columns)
plt.show()

# One histogram per selected column. Let pandas build the subplot grid
# itself: handing it a single pre-made axes for several columns makes
# pandas warn and clear that figure.
df[numerical_columns].hist(figsize=(20, 20))
plt.show()
유의미한 컬럼들을 따로 모은 후, 상관관계를 -1부터 1까지 나타내는 시각화
상관관계를 시각화 한 히트맵
빨간값과 파란값을 갖는 컬럼의 박스플롯
'📡 WIDA > DACON 분류-회귀' 카테고리의 다른 글
[DACON/๊น๊ท๋ฆฌ] ํ์ด์ฌ์ ์ด์ฉํ EDA (0) | 2023.04.07 |
---|---|
[DACON/๊น๊ฒฝ์] ํ์ด์ฌ์ ์ด์ฉํ EDA (0) | 2023.04.07 |
[DACON/์กฐ์์] ํ์ด์ฌ์ ์ด์ฉํ EDA (0) | 2023.04.07 |
[DACON/๊น๋ฏผํ] ํ์ด์ฌ์ ์ด์ฉํ EDA (0) | 2023.04.07 |
[DACON/๊น์ธ์ฐ] ๋ถ๋ฅ ๋ชจ๋ธ ๋ฏ์ด๋ณด๊ธฐ, ๋ถ๋ฅ ๋ชจ๋ธ ํ๊ฐ๋ฐฉ์ (0) | 2023.03.31 |