基于提供的数据,我们可以进行以下几个方面的核心分析:
import pandas as pd
import numpy as np
# 假设我们有一个DataFrame df 包含了所有直播间的数据
df = pd.read_csv('livestream_data.csv') # 从CSV文件加载数据
# 计算短视频引流占比
df['ShortVideoReferralRatio'] = df['ShortVideoTraffic'] / (df['TotalTraffic'] - df['OtherTraffic'])
# 排名前3个直播间
top_3_sales_indices = df['Sales'].nlargest(3).index.tolist()
top_3_referrals = df.loc[top_3_sales_indices, 'ShortVideoTraffic'].sum() / df['ShortVideoTraffic'].sum()
# 筛选出引流占比较高的直播间
high_referral_ratio = 0.25 # 假设选择前25%的直播间
high_referring_livestreams = df[df['ShortVideoReferralRatio'] >= np.percentile(df['ShortVideoReferralRatio'], high_referral_ratio)]
common_categories = high_referring_livestreams['Category'].value_counts()
# 粉丝数与引流能力的关系
fans_vs_referrals = pd.DataFrame({
'Fans': df['Fans'],
'ReferralRatio': df['ShortVideoReferralRatio']
})
slope, intercept, r_value, p_value, std_err = np.polyfit(fans_vs_referrals['Fans'], fans_vs_referrals['ReferralRatio'], 1)
print(f"回归斜率: {slope}, 截距: {intercept}, 相关系数: {r_value}")
以上分析数据来源:互联岛