%%capture
!pip install wordcloud
import json
import matplotlib.pyplot as plt
import numpy as np
import os
import pandas as pd
import re
import seaborn as sns
from IPython import display
from wordcloud import WordCloud

# Keep DataFrame previews compact: show at most 5 rows before truncating.
pd.set_option("display.max_rows", 5)


# Load the reading log, then convert each date column to pandas datetimes
# so the later cells can sort by date and subtract dates.
df = pd.read_csv('2023-books.csv')
for date_column in ('start_date', 'end_date', 'first_published'):
    df[date_column] = pd.to_datetime(df[date_column])
df


def display_book(book, comment=''):
    """Build a Markdown snippet showing a book's cover image and a caption.

    Args:
        book: A row selection (for example ``df.head(1)``); the ``slug``
            value of its first row names the cover image file.
        comment: Text placed on its own paragraph below the image.

    Returns:
        The ``display.Markdown`` object wrapping the generated snippet.
    """
    slug = book['slug'].iloc[0]
    markdown_source = f"""
![](https://egrajeda.com/images/{slug}.jpg)\n
{comment}
    """
    return display.Markdown(markdown_source)


# Headline number: how many rows the reading log contains.
book_count = len(df)
display.Markdown("I read a total of {:,} books".format(book_count))


# Sort ascending by publication date so the earliest-published book comes first.
books_by_publication = df.sort_values(by=['first_published'])
oldest_book = books_by_publication.iloc[:1]
oldest_published_on = oldest_book['first_published'].iloc[0]
display_book(oldest_book, "☝️ First published in {:%B %d, %Y}".format(oldest_published_on))


# Add up the page counts of every book in the log.
total_pages = df['pages'].sum()
total_pages_message = "A grand total of ✨ {:,} pages ✨".format(total_pages)
display.Markdown(total_pages_message)


# Sort by page count once; the two extremes are the first and last rows.
books_by_pages = df.sort_values(by=['pages'])
shortest_book = books_by_pages.iloc[:1]
longest_book = books_by_pages.iloc[-1:]
shortest_pages = shortest_book['pages'].iloc[0]
display_book(shortest_book, f"🫣 My shortest book was {shortest_pages} pages")


longest_pages = longest_book['pages'].iloc[0]
display_book(longest_book, f"💪 My longest book was {longest_pages} pages")


# Mean page count across all books, shown rounded to a whole number.
pages_mean = df['pages'].mean()
average_length_message = "My average book length was ✨ {:,.0f} pages ✨".format(pages_mean)
display.Markdown(average_length_message)


# Reading pace = pages divided by the whole days between start and end date.
# A book started and finished on the same date has a 0-day difference, which
# would make the division produce inf and wrongly rank that book as the
# fastest read. Clamp the span to at least one day (this also neutralises a
# negative span caused by swapped dates in the data).
reading_days = (df['end_date'] - df['start_date']).dt.days.clip(lower=1)
df['pages_per_day'] = df['pages'] / reading_days
# Sort by pace once: the slowest read is the first row, the fastest the last.
books_by_pace = df.sort_values(by=['pages_per_day'])
slowest_book = books_by_pace.head(1)
fastest_book = books_by_pace.tail(1)

display_book(fastest_book, "🏃 Read {:,.0f} pages per day".format(fastest_book['pages_per_day'].iloc[0]))


display_book(slowest_book, "🐢 Read {:,.0f} pages per day".format(slowest_book['pages_per_day'].iloc[0]))


# Count how often each tag appears across all books. Every "tags" cell holds a
# comma-separated list, so split it and give each tag its own row first.
# Series.explode() does not take a column name (its only parameter is
# ignore_index), so it is called without arguments. Tags are stripped of
# surrounding whitespace so "a, b" and "a,b" count the same tag.
tags_count = df["tags"].str.split(',').explode().str.strip().value_counts()
# Render the tag frequencies as a word cloud on a white background.
tags_word_cloud = WordCloud(background_color="white").generate_from_frequencies(tags_count)
plt.imshow(tags_word_cloud, interpolation='bilinear')
# Hide the axes; the trailing semicolon suppresses the notebook's text output.
plt.axis("off");

	name	slug	pages	start_date	end_date	first_published	tags
0	Zen Mind, Beginner's Mind: Informal talks on Z...	zen-mind-beginners-mind	138	2023-01-01	2023-01-15	1970-06-01	philosophy,buddhism,non-fiction
1	Tress of the Emerald Sea	tress-of-the-emerald-sea	369	2023-01-16	2023-01-22	2023-01-10	fantasy,fiction,cosmere
...	...	...	...	...	...	...	...
17	Doble Cara	doble-cara	416	2023-11-13	2023-12-08	2023-05-09	politics,non-fiction
18	Another Now	another-now	240	2023-12-09	2023-12-15	2020-09-10	economics,politics,fiction

2023 in Books¶

Setting up the data and some useful functions¶

🧮 How many books did I read this year?¶

🧓 What was the oldest book I read this year?¶

🤔 How many pages did I read this year?¶

Which were the shortest 🫣 and the longest 💪 books I read this year?¶

📖 What was my average book length this year?¶

🏃 Which book did I read the fastest, and which one did I read the slowest?¶

☁️ What types of books did I read this year?¶