import random
import string
import matplotlib.pyplot as plt
import pandas as pd
from collections import Counter

df = pd.read_csv("top-1m.csv")

domain_list = df['domain'].values.tolist()


first_letter_counts = Counter([domain[0] for domain in domain_list])

df = pd.DataFrame.from_dict(
    first_letter_counts, orient="index", columns=["count"]
).sort_index()

plt.figure(figsize=(12, 6))
plt.bar(df.index, df["count"])
plt.title("Distribution of First Letters in Domain Names")
plt.xlabel("First Letter")
plt.ylabel("Count")
plt.xticks(fontsize=10)
plt.yticks(fontsize=10)
plt.grid(axis="y", linestyle="--", alpha=0.7)

plt.savefig("first_letter_distribution.png")
