メディア展開データの内訳を見る

メディア展開データの内訳を見る#

準備#

Import#

変数#

関数#

Show code cell content Hide code cell content

def create_mosaicplot(
    df: pd.DataFrame,
    x: str,
    y: str,
    color: str,
    width: str,
    text: str,
    color_discrete_sequence: List[str] = OKABE_ITO,
) -> go.Figure:
    """
    Build a mosaic plot (stacked bars of variable width) from a DataFrame.

    One ``go.Bar`` trace is added per unique value of the ``color`` column.
    Within each trace the bars are laid out left to right, each bar starting
    where the previous one ended, so that the ``width`` column controls the
    bar thickness. The traces are stacked on top of each other.

    The x-axis tick positions and labels are taken from the first group only.
    NOTE(review): this presumes every group lists the same x categories in the
    same row order with the same widths -- confirm against the caller's data.

    Parameters
    ----------
    df : pd.DataFrame
        DataFrame holding the data to plot.
    x : str
        Name of the column whose values label the x-axis ticks.
    y : str
        Name of the column providing the bar heights.
    color : str
        Name of the column used to split the data into traces.
    width : str
        Name of the column providing the width of each bar.
    text : str
        Name of the column providing the text shown on each bar.
    color_discrete_sequence : List[str], optional
        Colors assigned to the groups in order of first appearance. Defaults
        to the OKABE_ITO palette. When there are more groups than colors the
        palette is reused from the start; when it is empty, no explicit color
        is passed and Plotly picks its own.

    Returns
    -------
    go.Figure
        The mosaic plot. If ``df`` has no rows, the figure contains no traces
        and only the axis titles and layout are set.
    """

    # Start from an empty figure and add one trace per group
    fig = go.Figure()

    # Groups in order of first appearance in the color column
    unique_keys = df[color].unique()

    # Materialize the palette so it can be indexed cyclically
    palette = list(color_discrete_sequence)

    # Tick settings come from the first group; stay None when there is no data
    tickvals = None
    ticktext = None
    x_max = None

    for i, name in enumerate(unique_keys):
        df_tmp = df[df[color] == name].reset_index(drop=True)
        # Bar widths for this group
        widths = df_tmp[width]

        # Wrap around the palette instead of failing when groups outnumber colors
        marker_color = palette[i % len(palette)] if palette else None

        # With offset=0 the x value is the bar's left edge, so each bar starts
        # at the cumulative width of the bars before it
        fig.add_trace(
            go.Bar(
                name=name,
                x=widths.cumsum() - widths,
                y=df_tmp[y],
                text=df_tmp[text],
                width=widths,
                offset=0,
                marker_color=marker_color,
            )
        )

        # Use the first group to derive the x-axis tick settings
        if i == 0:
            # Place each tick at the horizontal center of its bar
            tickvals = widths.cumsum() - widths / 2
            ticktext = df_tmp[x].unique()
            # Total width, used to decide the visible x range
            x_max = widths.sum()

    # Always set the x-axis title; ticks and range only when data was plotted
    xaxis_kwargs = {"title": x}
    if tickvals is not None:
        # Leave a margin of 10% of the total bar width on both sides
        xaxis_kwargs.update(
            tickvals=tickvals,
            ticktext=ticktext,
            range=[-x_max * 0.1, x_max * 1.1],
        )
    fig.update_xaxes(**xaxis_kwargs)

    # Set the y-axis title
    fig.update_yaxes(title=y)

    # Stack the traces and title the legend with the grouping column
    fig.update_layout(barmode="stack", legend_title=color)

    return fig

可視化例#

円グラフ#

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_pie.head()

	アニメ化	マンガ作品数
0	False	1208
1	True	129

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_pie2.head()

	マンガ雑誌名	アニメ化	マンガ作品数
0	週刊少年サンデー	False	255
1	週刊少年サンデー	True	32
2	週刊少年ジャンプ	False	288
3	週刊少年ジャンプ	True	49
4	週刊少年チャンピオン	False	381

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_pie3.head()

	マンガ雑誌名	アニメ化	マンガ作品数	アニメ化率
0	週刊少年チャンピオン	False	381	0.028061
1	週刊少年チャンピオン	True	11	0.028061
2	週刊少年サンデー	False	255	0.111498
3	週刊少年サンデー	True	32	0.111498
4	週刊少年マガジン	False	284	0.115265

棒グラフ#

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_bar.head()

	マンガ雑誌名	アニメ化	マンガ作品数	マンガ雑誌名_total	比率	text	アニメ化率
0	週刊少年チャンピオン	True	11	392	0.028061	0.03	0.028061
1	週刊少年チャンピオン	False	381	392	0.971939	0.97	0.028061
2	週刊少年サンデー	True	32	287	0.111498	0.11	0.111498
3	週刊少年サンデー	False	255	287	0.888502	0.89	0.111498
4	週刊少年マガジン	True	37	321	0.115265	0.12	0.115265

モザイクプロット#

Show code cell content Hide code cell content

# Display the DataFrame to be visualized
df_mosaic.head()

	マンガ雑誌名	アニメ化	マンガ作品数	マンガ雑誌名_total	比率	text	アニメ化率
0	週刊少年チャンピオン	True	11	392	0.028061	0.03	0.028061
1	週刊少年チャンピオン	False	381	392	0.971939	0.97	0.028061
2	週刊少年サンデー	True	32	287	0.111498	0.11	0.111498
3	週刊少年サンデー	False	255	287	0.888502	0.89	0.111498
4	週刊少年マガジン	True	37	321	0.115265	0.12	0.115265

積上げ密度プロット[1]#

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_area.head()

	連載開始年	アニメ化	マンガ作品数	first_year_cc_total	比率
0	1990	True	4	50	0.080000
1	1990	False	46	50	0.920000
2	1991	True	3	51	0.058824
3	1991	False	48	51	0.941176
4	1992	True	1	45	0.022222

Show code cell content Hide code cell content

# Select the works whose serialization started in 2003 and that were animated,
# showing only the chosen columns
df_cc_ac.loc[
    (df_cc_ac["first_year_cc"] == 2003) & (df_cc_ac["is_animated"]),
    ["mcname", "ccname", "acname"],
]

	mcname	ccname	acname
623	週刊少年サンデー	MAR メル	MÄR メルヘヴン MÄRCHEN AWAKENS ROMANCE
629	週刊少年マガジン	魔法先生ネギま! MAGISTER NEGI MAGI	魔法先生ネギま!
637	週刊少年サンデー	結界師	結界師
640	週刊少年マガジン	ツバサ～RESERVoir CHRoNiCLE～	ツバサ・クロニクル　年代記[第1期]
644	週刊少年ジャンプ	武装錬金	武装錬金
652	週刊少年ジャンプ	DEATH NOTE	DEATH NOTE
663	週刊少年ジャンプ	家庭教師ヒットマンREBORN!	家庭教師* ヒットマン REBORN! *［かてきょー］
664	週刊少年マガジン	涼風	涼風［すずか］

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_area2.head()

	マンガ雑誌名	連載開始年	アニメ化	マンガ作品数	mcname_fyear_total	比率
0	週刊少年サンデー	1990	True	1	12	0.083333
1	週刊少年サンデー	1990	False	11	12	0.916667
2	週刊少年サンデー	1991	True	1	10	0.100000
3	週刊少年サンデー	1991	False	9	10	0.900000
4	週刊少年サンデー	1992	False	14	14	1.000000

ツリーマップ#

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_tree.head()

	マンガ雑誌名	マンガ作品名	アニメ各話数
0	週刊少年サンデー	うしおととら	26.0
1	週刊少年マガジン	シュート!	58.0
2	週刊少年ジャンプ	SLAM DUNK	101.0
3	週刊少年ジャンプ	幽☆遊☆白書	112.0
4	週刊少年サンデー	ゴーストスイーパー美神極楽大作戦!!	45.0

パラレルセットグラフ#

Show code cell content Hide code cell content

# Inspect the DataFrame to be visualized
df_par.head()

	マンガ作品ID	アニメ化	合計話数	マンガ雑誌名
0	C92355	False	8-17話	週刊少年サンデー
1	C93126	False	8-17話	週刊少年サンデー
2	C91698	False	8-17話	週刊少年サンデー
3	C93467	False	8-17話	週刊少年サンデー
4	C93829	False	8-17話	週刊少年サンデー

メディア展開データの内訳を見る

Contents

メディア展開データの内訳を見る#

準備#

Import#

変数#

関数#

可視化例#

円グラフ#

棒グラフ#

モザイクプロット#

積上げ密度プロット[1]#

ツリーマップ#

パラレルセットグラフ#