from matplotlib import pyplot as plt


# Bar chart: number of Academy Awards won by each movie.
num_oscars = [5, 11, 3, 8, 10]
movies = ["Annie Hall", "Ben-Hur", "Casablanca", "Gandhi", "West Side Story"]

# One bar per movie, drawn at the integer x positions 0, 1, 2, 3, 4.
bar_positions = range(len(movies))
plt.bar(bar_positions, num_oscars)

# Replace the numeric x ticks with the movie titles.
plt.xticks(bar_positions, movies)
plt.ylabel("# of Academy Awards")  # y-axis label

plt.show()


# Bar chart whose y-axis is deliberately truncated to exaggerate a small change.
years = [2017, 2018]
mentions = [500, 505]

plt.bar(years, mentions, width=0.8)
plt.ylabel("# of times I heard someone say 'data science'")
plt.xticks(years)  # needed so the x-axis ticks are exactly the two years

# Show tick values as-is instead of relative to an offset.
plt.ticklabel_format(useOffset=False)

# Starting the y-axis at 499 makes a 1% difference look enormous (misleading).
misleading_view = [2016.5, 2018.5, 499, 506]  # [xmin, xmax, ymin, ymax]
plt.axis(misleading_view)
plt.title("Look at the 'Huge' Increase!")
plt.show()


# Same data as the previous figure, but with an honest y-axis starting at 0.
plt.bar(years, mentions, width=0.8)
plt.ylabel("# of times I heard someone say 'data science'")
plt.xticks(years)
plt.ticklabel_format(useOffset=False)

# Starting the y-axis at 0 changes the picture: the increase is barely visible.
honest_view = [2016.5, 2018.5, 0, 550]  # [xmin, xmax, ymin, ymax]
plt.axis(honest_view)
plt.title("Not So Huge Anymore")

plt.tight_layout()

plt.show()


from collections import Counter

# Histogram of exam grades grouped into buckets of ten points.
grades = [83, 95, 91, 87, 70, 0, 85, 82, 100, 67, 73, 77, 0]

# Map every grade to the start of its bucket (0, 10, ..., 90);
# a perfect 100 is folded into the 90 bucket.
bucket_starts = [min(10 * (score // 10), 90) for score in grades]
histogram = Counter(bucket_starts)

# Shift each bar right by 5 so it is centered on its bucket.
bar_centers = [start + 5 for start in histogram]
plt.bar(
    bar_centers,
    histogram.values(),   # bar height = number of students in the bucket
    width=10,             # each bar spans one full bucket
    edgecolor=(0, 0, 0),  # black outline around every bar
)

# x-axis from -5 to 105, y-axis from 0 to 5.
plt.axis([-5, 105, 0, 5])

# x-axis ticks at 0, 10, ..., 100.
plt.xticks(list(range(0, 101, 10)))
plt.title("Distribution of Exam 1 Grades")
plt.xlabel("Decile")
plt.ylabel("# of Students")
plt.show()


# Line chart: nominal GDP per decade.
gdp = [300.2, 543.3, 1075.9, 2862.5, 5979.6, 10289.7, 14958.3]
years = [1950, 1960, 1970, 1980, 1990, 2000, 2010]

# Years on the x-axis, GDP on the y-axis; solid green line with round markers.
plt.plot(
    years,
    gdp,
    color='green',
    marker='o',
    linestyle='solid',
)

plt.ylabel("Billions of $")
plt.title("Nominal GDP")
plt.show()


# Scatter plot: daily minutes on the site versus number of friends,
# with one letter label per user.
friends = [70, 65, 72, 63, 71, 64, 60, 64, 67]
minutes = [175, 170, 205, 120, 220, 130, 105, 145, 190]
labels = ['a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i']

plt.scatter(friends, minutes)

# Attach each label to its point, nudged slightly so it does not sit on the marker.
label_offset = (5, -5)
for label, friend_count, minute_count in zip(labels, friends, minutes):
    plt.annotate(
        label,
        xy=(friend_count, minute_count),  # the point being labeled
        xytext=label_offset,              # offset from that point
        textcoords='offset points',
    )

plt.title("Daily Minutes vs. Number of Friends")
plt.ylabel("daily minutes spent on the site")
plt.xlabel("# of friends")
plt.show()


# Scatter plot of two test scores with matplotlib's default (independent) axis scaling.
test_2_grades = [100, 85, 60, 90, 70]
test_1_grades = [99, 90, 85, 97, 80]

plt.scatter(test_1_grades, test_2_grades)
plt.xlabel("test 1 grade")
plt.ylabel("test 2 grade")
plt.title("Axes Aren't Comparable")
plt.show()


# Same scatter plot, this time forcing both axes onto the same scale.
test_2_grades = [100, 85, 60, 90, 70]
test_1_grades = [99, 90, 85, 97, 80]

plt.scatter(test_1_grades, test_2_grades)
plt.xlabel("test 1 grade")
plt.ylabel("test 2 grade")
plt.axis("equal")  # make both axes use the same scale
plt.title("Axes Are Comparable")
plt.show()

점수 구간(십분위수)	0-9	10-19	20-29	30-39	40-49	50-59	60-69	70-79	80-89	90-100
학생 수	2	0	0	0	0	0	1	3	4	3

그래프와 시각화 1편

막대 그래프

막대 그래프 예제

막대 그래프 유의사항

y축의 시작을 499로 잡는 경우

y축의 시작을 0으로 잡는 경우

히스토그램

히스토그램 예제

선 그래프

선 그래프 예제

산점도

산점도 예제

산점도 유의사항

축 지정

양 축의 척도(scale)가 다른 경우

양 축의 척도가 동일한 경우

영화 제목	Annie Hall	Ben-Hur	Casablanca	Gandhi	West Side Story
수상 횟수	5	11	3	8	10

연도	1950	1960	1970	1980	1990	2000	2010
GDP	300.2	543.3	1075.9	2862.5	5979.6	10289.7	14958.3

친구 수	70	65	72	63	71	64	60	64	67
이용 시간	175	170	205	120	220	130	105	145	190
사용자 라벨	a	b	c	d	e	f	g	h	i

연도	2017	2018
횟수	500	505

1차 테스트	99	90	85	97	80
2차 테스트	100	85	60	90	70