import matplotlib.pyplot as plt
%matplotlib inline

#그래프 데이터 
subject = ['English', 'Math', 'Korean', 'Science', 'Computer']
points = [40, 90, 50, 60, 100]

# 축 그리기
fig = plt.figure()            # 도화지 펼치기 
ax1 = fig.add_subplot(1,1,1)  # 1행 1열로 1개 그릴수 있다는 뜻

# 그래프 그리기
ax1.bar(subject, points)

# 라벨, 타이틀 달기
plt.xlabel('Subject')
plt.ylabel('Points')
plt.title("Yuna's Test Result")

# 보여주기
plt.savefig('./barplot.png')  # 그래프를 이미지로 출력
plt.show()                    # 그래프를 화면으로 출력


from datetime import datetime
import pandas as pd
import os

#그래프 데이터 
csv_path = os.getenv("HOME") + "/aiffel/data_represent/data/AMZN.csv"
data = pd.read_csv(csv_path ,index_col=0, parse_dates=True)
price = data['Close']

# 축 그리기 및 좌표축 설정
fig = plt.figure()
ax = fig.add_subplot(1,1,1)
price.plot(ax=ax, style='black')  # subplot을 사용한다
plt.ylim([1600,2200])
plt.xlim(['2019-05-01','2020-03-01'])

# 주석달기
important_data = [(datetime(2019, 6, 3), "Low Price"),(datetime(2020, 2, 19), "Peak Price")]
for d, label in important_data:
    ax.annotate(label, xy=(d, price.asof(d)+10), 
                xytext=(d,price.asof(d)+100),
                arrowprops=dict(facecolor='red'))

# 그리드, 타이틀 달기
plt.grid()    # 격자눈금 추가
ax.set_title('StockPrice')

# 보여주기
plt.show()


import numpy as np
x = np.linspace(0, 10, 100) 
plt.plot(x, np.sin(x),'o')
plt.plot(x, np.cos(x),'--', color='black') 
plt.show()


x = np.linspace(0, 10, 100) 

plt.subplot(2,1,1)
plt.plot(x, np.sin(x),'orange','o')

plt.subplot(2,1,2)
plt.plot(x, np.cos(x), 'orange') 
plt.show()


# linestyle, marker옵션
x = np.linspace(0, 10, 100) 

plt.plot(x, x + 0, linestyle='solid') 
plt.plot(x, x + 1, linestyle='dashed') 
plt.plot(x, x + 2, linestyle='dashdot') 
plt.plot(x, x + 3, linestyle='dotted')
plt.plot(x, x + 0, '-g') # solid green 
plt.plot(x, x + 1, '--c') # dashed cyan 
plt.plot(x, x + 2, '-.k') # dashdot black 
plt.plot(x, x + 3, ':r'); # dotted red
plt.plot(x, x + 4, linestyle='-') # solid 
plt.plot(x, x + 5, linestyle='--') # dashed 
plt.plot(x, x + 6, linestyle='-.') # dashdot 
plt.plot(x, x + 7, linestyle=':'); # dotted


fig, axes = plt.subplots(2, 1)
data = pd.Series(np.random.rand(5), index=list('abcde'))
data.plot(kind='bar', ax=axes[0], color='blue', alpha=1)
data.plot(kind='barh', ax=axes[1], color='red', alpha=0.3)

<AxesSubplot:>


df = pd.DataFrame(np.random.rand(6,4), columns=pd.Index(['A','B','C','D']))
df.plot(kind='line')

<AxesSubplot:>


import pandas as pd
import seaborn as sns

tips = sns.load_dataset("tips")


df = pd.DataFrame(tips)
df.head()


df.shape

(244, 7)


df.describe()


df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 244 entries, 0 to 243
Data columns (total 7 columns):
 #   Column      Non-Null Count  Dtype   
---  ------      --------------  -----   
 0   total_bill  244 non-null    float64 
 1   tip         244 non-null    float64 
 2   sex         244 non-null    category
 3   smoker      244 non-null    category
 4   day         244 non-null    category
 5   time        244 non-null    category
 6   size        244 non-null    int64   
dtypes: category(4), float64(2), int64(1)
memory usage: 7.3 KB


print(df['sex'].value_counts())
print("===========================")


print(df['time'].value_counts())
print("===========================")


print(df['smoker'].value_counts())
print("===========================")


print(df['day'].value_counts())
print("===========================")


print(df['size'].value_counts())
print("===========================")

Male      157
Female     87
Name: sex, dtype: int64
===========================
Dinner    176
Lunch      68
Name: time, dtype: int64
===========================
No     151
Yes     93
Name: smoker, dtype: int64
===========================
Sat     87
Sun     76
Thur    62
Fri     19
Name: day, dtype: int64
===========================
2    156
3     38
4     37
5      5
6      4
1      4
Name: size, dtype: int64
===========================


# matplotlib에 데이터를 인자로 넣기 위해선 pandas 데이터를 바로 이용할 수는 없으므로 데이터를 x, y에 series, list 형태로 각각 나눠주어야함.
grouped = df['tip'].groupby(df['sex'])


grouped.mean() # 성별에 따른 팁의 평균

sex
Male      3.089618
Female    2.833448
Name: tip, dtype: float64


grouped.size() # 성별에 따른 데이터 량(팁 횟수)

sex
Male      157
Female     87
Name: tip, dtype: int64


import numpy as np
sex = dict(grouped.mean())
x = list(sex.keys())
y = list(sex.values())

plt.bar(x, y)
plt.ylabel('tip[$]')
plt.title('Tip by Sex')
#plt.legend()

Text(0.5, 1.0, 'Tip by Sex')


sns.barplot(data=df, x='sex', y='tip')

<AxesSubplot:xlabel='sex', ylabel='tip'>


plt.figure(figsize=(10,6))
sns.barplot(data=df, x='sex', y='tip')
plt.ylim(0, 4)
plt.title('Tip by sex')

Text(0.5, 1.0, 'Tip by sex')


plt.figure(figsize=(10,6))
sns.barplot(data=df, x='day', y='tip')
plt.ylim(0, 4)
plt.title('Tip by day')

Text(0.5, 1.0, 'Tip by day')


fig = plt.figure(figsize=(13,10))
ax1 = fig.add_subplot(2,2,1)
sns.barplot(data=df, x='day', y='tip',palette="ch:.25")
ax2 = fig.add_subplot(2,2,2)
sns.barplot(data=df, x='sex', y='tip')
ax3 = fig.add_subplot(2,2,4)
sns.violinplot(data=df, x='sex', y='tip')
ax3 = fig.add_subplot(2,2,3)
sns.violinplot(data=df, x='day', y='tip',palette="ch:.25")

<AxesSubplot:xlabel='day', ylabel='tip'>


sns.catplot(x="day", y="tip", jitter=False, data=tips)

<seaborn.axisgrid.FacetGrid at 0x7f7bda1f0b50>


sns.scatterplot(data=df , x='total_bill', y='tip', palette="ch:r=-.2,d=.3_r")

<AxesSubplot:xlabel='total_bill', ylabel='tip'>


sns.scatterplot(data=df , x='total_bill', y='tip', hue='day')

<AxesSubplot:xlabel='total_bill', ylabel='tip'>


x = np.linspace(0, 10, 100) 
plt.plot(x, np.sin(x), 'o')
plt.plot(x, np.cos(x)) 
plt.show()


sns.lineplot(x, np.sin(x))
sns.lineplot(x, np.cos(x))

/home/ssac24/anaconda3/envs/aiffel/lib/python3.7/site-packages/seaborn/_decorators.py:43: FutureWarning: Pass the following variables as keyword args: x, y. From version 0.12, the only valid positional argument will be `data`, and passing other arguments without an explicit keyword will result in an error or misinterpretation.
  FutureWarning
/home/ssac24/anaconda3/envs/aiffel/lib/python3.7/site-packages/seaborn/_decorators.py:43: FutureWarning: Pass the following variables as keyword args: x, y. From version 0.12, the only valid positional argument will be `data`, and passing other arguments without an explicit keyword will result in an error or misinterpretation.
  FutureWarning

<AxesSubplot:>


#그래프 데이터 
mu1, mu2, sigma = 100, 130, 15              # x1,x2 의 평균은 100, 130
x1 = mu1 + sigma*np.random.randn(10000)
x2 = mu2 + sigma*np.random.randn(10000)

# 축 그리기
fig = plt.figure()
ax1 = fig.add_subplot(1,1,1)

# 그래프 그리기 / 도수를 50개의 구간으로 표시하며, 확률 밀도가 아닌 빈도로 표기
patches = ax1.hist(x1, bins=50, density=False)
patches = ax1.hist(x2, bins=50, density=False, alpha=0.5)
ax1.xaxis.set_ticks_position('bottom')
ax1.yaxis.set_ticks_position('left')

# 라벨, 타이틀 달기
plt.xlabel('Bins')
plt.ylabel('Number of Values in Bin')
ax1.set_title('Two Frequency Distributions')

# 보여주기
plt.show()


sns.distplot(df['total_bill'])
sns.distplot(df['tip'])

/home/ssac24/anaconda3/envs/aiffel/lib/python3.7/site-packages/seaborn/distributions.py:2557: FutureWarning: `distplot` is a deprecated function and will be removed in a future version. Please adapt your code to use either `displot` (a figure-level function with similar flexibility) or `histplot` (an axes-level function for histograms).
  warnings.warn(msg, FutureWarning)
/home/ssac24/anaconda3/envs/aiffel/lib/python3.7/site-packages/seaborn/distributions.py:2557: FutureWarning: `distplot` is a deprecated function and will be removed in a future version. Please adapt your code to use either `displot` (a figure-level function with similar flexibility) or `histplot` (an axes-level function for histograms).
  warnings.warn(msg, FutureWarning)

<AxesSubplot:xlabel='tip', ylabel='Density'>


# 전체 결제 금액 대비 팁의 비율
df['tip_pct'] = df['tip'] / df['total_bill']
df['tip_pct'].hist(bins=50)

<AxesSubplot:>


# KDE(Kernel Density Estimate) 커널 밀도 추정 그래프로 표현
df['tip_pct'].plot(kind='kde')

<AxesSubplot:ylabel='Density'>


csv_path = os.getenv("HOME") + "/aiffel/data_represent/data/flights.csv"
data = pd.read_csv(csv_path)
flights = pd.DataFrame(data)
flights


sns.barplot(data=flights, x='year', y='passengers')

<AxesSubplot:xlabel='year', ylabel='passengers'>


sns.pointplot(data=flights, x='year', y='passengers')

<AxesSubplot:xlabel='year', ylabel='passengers'>


sns.lineplot(data=flights, x='year', y='passengers')

<AxesSubplot:xlabel='year', ylabel='passengers'>


# month 별로 나누기 위해 hue 값을 줌
sns.lineplot(data=flights, x='year', y='passengers', hue='month', palette='ch:.50')
plt.legend(bbox_to_anchor=(1.03, 1), loc=2) #legend 그래프 밖에 추가하기

<matplotlib.legend.Legend at 0x7f7bd0878550>


# 히스토그램
sns.distplot(flights['passengers'])

/home/ssac24/anaconda3/envs/aiffel/lib/python3.7/site-packages/seaborn/distributions.py:2557: FutureWarning: `distplot` is a deprecated function and will be removed in a future version. Please adapt your code to use either `displot` (a figure-level function with similar flexibility) or `histplot` (an axes-level function for histograms).
  warnings.warn(msg, FutureWarning)

<AxesSubplot:xlabel='passengers', ylabel='Density'>


# 데이터의 재배치 pivot
pivot = flights.pivot(index='year', columns='month', values='passengers')
pivot


sns.heatmap(pivot)

<AxesSubplot:xlabel='month', ylabel='year'>


sns.heatmap(pivot, linewidths=.2, annot=True, fmt="d")

<AxesSubplot:xlabel='month', ylabel='year'>


sns.heatmap(pivot, cmap="YlGnBu")

<AxesSubplot:xlabel='month', ylabel='year'>

	total_bill	tip	size
count	244.000000	244.000000	244.000000
mean	19.785943	2.998279	2.569672
std	8.902412	1.383638	0.951100
min	3.070000	1.000000	1.000000
25%	13.347500	2.000000	2.000000
50%	17.795000	2.900000	2.000000
75%	24.127500	3.562500	3.000000
max	50.810000	10.000000	6.000000

	year	month	passengers
0	1949	January	112
1	1949	February	118
2	1949	March	132
3	1949	April	129
4	1949	May	121
...	...	...	...
139	1960	August	606
140	1960	September	508
141	1960	October	461
142	1960	November	390
143	1960	December	432

month	April	August	December	February	January	July	June	March	May	November	October	September
year
1949	129	148	118	118	112	148	135	132	121	104	119	136
1950	135	170	140	126	115	170	149	141	125	114	133	158
1951	163	199	166	150	145	199	178	178	172	146	162	184
1952	181	242	194	180	171	230	218	193	183	172	191	209
1953	235	272	201	196	196	264	243	236	229	180	211	237
1954	227	293	229	188	204	302	264	235	234	203	229	259
1955	269	347	278	233	242	364	315	267	270	237	274	312
1956	313	405	306	277	284	413	374	317	318	271	306	355
1957	348	467	336	301	315	465	422	356	355	305	347	404
1958	348	505	337	318	340	491	435	362	363	310	359	404
1959	396	559	405	342	360	548	472	406	420	362	407	463
1960	461	606	432	391	417	622	535	419	472	390	461	508

주사위 만들기 (0)	2021.01.25
sklearn의 이해 (0)	2021.01.22
fibonacci함수 (0)	2021.01.08
1주차 leetcode😢 (0)	2021.01.08
파이썬 명령어 모음 (0)	2020.12.31

A.I

A.I

파이썬으로 그래프 그리기 본문

파이썬으로 그래프 그리기

1. 파이썬으로 그래프 그리기¶

ipython 매직명령어 정리 ¶

2. 주석 기법을 통한 선 그래프 그리기¶

3. plt.plot()로 그래프 그리기¶

4. Pandas로 그래프 그리기¶

pandas.plot메서드 인자

pandas의 data가 DataFrame일때 plot 메서드 인자

각 요소 별 명칭¶

5. Seaborn 데이터로 그래프 그리기¶

5-1. 범주형 데이터 그래프¶

5-2. 수치형 그래프¶

5-3. 히스토그램¶

6. 시계열 데이터 그래프화¶

7. Heatmap¶

'파이썬 & AI 학습' 카테고리의 다른 글

티스토리툴바

	total_bill	tip	sex	smoker	day	time	size
0	16.99	1.01	Female	No	Sun	Dinner	2
1	10.34	1.66	Male	No	Sun	Dinner	3
2	21.01	3.50	Male	No	Sun	Dinner	3
3	23.68	3.31	Male	No	Sun	Dinner	2
4	24.59	3.61	Female	No	Sun	Dinner	4

« 2025/04 »
일	월	화	수	목	금	토
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30

A.I

파이썬으로 그래프 그리기 본문

파이썬으로 그래프 그리기

1. 파이썬으로 그래프 그리기¶

ipython 매직명령어 정리¶

2. 주석 기법을 통한 선 그래프 그리기¶

3. plt.plot()로 그래프 그리기¶

4. Pandas로 그래프 그리기¶

pandas.plot메서드 인자

pandas의 data가 DataFrame일때 plot 메서드 인자

각 요소 별 명칭¶

5. Seaborn 데이터로 그래프 그리기¶

5-1. 범주형 데이터 그래프¶

5-2. 수치형 그래프¶

5-3. 히스토그램¶

6. 시계열 데이터 그래프화¶

7. Heatmap¶

'파이썬 & AI 학습' 카테고리의 다른 글

티스토리툴바

ipython 매직명령어 정리 ¶