# Certifications

We used the RIAA's "Artists By Certified Album Units Sold" data to examine the certification levels (Gold, Platinum, Multi-Platinum, and Diamond) and the certified album sales of the top 25 music artists (ranked by album sales). The data come from the RIAA database.

Here we can see that The Beatles have the highest album sales. It is interesting to note that Elvis Presley has by far the most Gold certifications and also the most Platinum certifications.

Hide code cell source
import plotly.graph_objs as go
import plotly.express as px
import pandas as pd

# Load the cleaned RIAA table and keep only its first 25 rows.
# NOTE(review): presumably the CSV is already ordered by certified units, so
# the first 25 rows are the top 25 artists -- confirm against the data file.
df = pd.read_csv('../cleaned/riaakaggle.csv').head(n=25)

# Thin black outline shared by every bar in the chart.
line = dict(color='black', width=0.4)

# One entry per bar series: (legend label, DataFrame column, fill colour).
# The order here is the order in which the traces are added to the figure.
bar_specs = [
    ('Certified (Million albums sold)', 'Certified Units', 'rgb(102,194,165)'),
    ('Gold (units)', 'Gold', 'rgb(245, 242, 76)'),
    ('Platinum (units)', 'Platinum', 'rgb(160, 178, 198)'),
    ('Multi-Platinum (units)', 'Multi-Platinum', 'rgb(148, 148, 143)'),
    ('Diamond (units)', 'Diamond', 'rgb(160,225,245)'),
]

# Build one bar trace per series, all plotted against the artist names.
data = [
    go.Bar(
        name=label,
        x=df['Artist'],
        y=df[column],
        marker=dict(color=colour, line=line),
    )
    for label, column, colour in bar_specs
]

# Artist names are treated as discrete categories on the x axis.
x_axis = go.layout.XAxis(type='category', title='Artist')
y_axis = go.layout.YAxis(title='Units')

# barmode='group' places the series side by side for each artist.
layout = go.Layout(
    title='Top 25 music artists by album sales with certificates',
    height=600,
    xaxis=x_axis,
    yaxis=y_axis,
    barmode='group',
)

fig = go.Figure(data=data, layout=layout)
fig.show()