# 弹幕中主要导演被提及的次数
# Count how many rows of df_all.content mention each main director
# (presumably one danmaku / bullet comment per row -- confirm against the
# code that builds df_all).  `str.contains` treats its argument as a regular
# expression by default, so every keyword below is a regex searched anywhere
# in the text.
chen_num = df_all.content.str.contains('凯哥').sum()
dong_num = df_all.content.str.contains('东升').sum()
zhao_num = df_all.content.str.contains('赵薇').sum()
# Either nickname counts as a mention: '|' is regex alternation.  A pattern
# with a literal space ('敬明 小四') would only match the two nicknames
# written together with a space in between.
guo_num = df_all.content.str.contains('敬明|小四').sum()
li_num = df_all.content.str.contains('诚儒').sum()
print(chen_num, dong_num, zhao_num, guo_num, li_num)

# One row per director; the counts are listed in the same order as the names.
data = pd.DataFrame({
    'name': ['陈凯歌', '尔东升', '赵薇', '郭敬明', '李诚儒'],
    'number': [chen_num, dong_num, zhao_num, guo_num, li_num],
})
# Most-mentioned director first.
data = data.sort_values('number', ascending=False)
data  # bare expression: shows the table when it ends a notebook cell

# Plain Python lists (in sorted order) for the chart axes.
x_data = data['name'].values.tolist()
y_data = data['number'].values.tolist()
# Bar chart of the director mention counts; bars follow the order of
# x_data / y_data.
bar2 = Bar(init_opts=opts.InitOpts(width='1350px', height='750px'))
bar2.add_xaxis(xaxis_data=x_data)
# The values are passed positionally: the keyword name of this parameter has
# changed across pyecharts releases (yaxis_data / y_axis), so the positional
# form is the portable one.  The series name is intentionally empty.
bar2.add_yaxis('', y_data)
bar2.set_global_opts(
    title_opts=opts.TitleOpts(title='弹幕中主要导演被提及的次数'),
    # Visual map scaled up to 60000 but hidden from the rendered chart.
    visualmap_opts=opts.VisualMapOpts(max=60000, is_show=False),
)
bar2.render_notebook()
# Slash-separated names of the participating actors.  The current value looks
# like placeholder text ("names of all participating actors") -- replace it
# with the real list, e.g. 'NameA/NameB/NameC'.
actor = '参演的所有演员名'
# Split into individual names.  Surrounding whitespace is trimmed and blank
# entries (e.g. from a trailing '/') are dropped, because an empty search
# pattern would match every comment.
actor_list = [name.strip() for name in actor.split('/') if name.strip()]
actor_list  # bare expression: shows the list when it ends a notebook cell
# Number of rows of df_all.content that mention each actor, in the same order
# as actor_list.  Each name is used as a regex by `str.contains`.
tiji_num = [df_all.content.str.contains(name).sum() for name in actor_list]
# First ten counts in actor_list order (the list is not sorted by count).
# The slice end is 10 so that the name matches the number of items taken.
top10 = tiji_num[:10]

# One row per actor with its mention count.
df_actor = pd.DataFrame({
    'actor_name': actor_list,
    'tiji_num': tiji_num,
})
df_actor.head(10)  # bare expression: previews the table in a notebook cell

# Plain Python lists for the chart axes; the counts live in the 'tiji_num'
# column of df_actor.
x_data = df_actor['actor_name'].values.tolist()
y_data = df_actor['tiji_num'].values.tolist()

# Bar chart of the actor mention counts; bars follow the row order of df_actor.
bar2 = Bar(init_opts=opts.InitOpts(width='1350px', height='750px'))
bar2.add_xaxis(xaxis_data=x_data)
# The values are passed positionally: the keyword name of this parameter has
# changed across pyecharts releases (yaxis_data / y_axis), so the positional
# form is the portable one.  The series name is intentionally empty.
bar2.add_yaxis('', y_data)
bar2.set_global_opts(
    # Title names actors: this chart plots df_actor, not the directors table.
    title_opts=opts.TitleOpts(title='弹幕中演员被提及的次数'),
    # Visual map scaled up to 60000 but hidden from the rendered chart.
    visualmap_opts=opts.VisualMapOpts(max=60000, is_show=False),
)
bar2.render_notebook()