一矢多穿:多目标排序在爱奇艺短视频推荐中的应用

{"type":"doc","content":[{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"短视频具有","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"内容丰富、信息集中、用户粘性大","attrs":{}},{"type":"text","text":"的特点,如何提高短视频","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"分发的效率","attrs":{}},{"type":"text","text":"和","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"推荐精准度","attrs":{}},{"type":"text","text":",有效提升","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"消费时长、留存","attrs":{}},{"type":"text","text":"等关键业务指标,是","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"推荐系统","attrs":{}},{"type":"text","text":"的核心能力和建模目标。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"本文主要分享在","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"短视频推荐","attrs":{}},{"type":"text","text":"场景下,爱奇艺基础推荐团队在","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"排序模型多目标优化","attrs":{}},{"type":"text","text":"方面的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"历史","attrs":{}},{"type":"text","text":"和","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"进展","attrs":{}},{"type":"text","text":"。第一部分主要介绍","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多目标建模的业务背景","attrs":{}},{"type":"text","text":",第二部分介绍爱奇艺在短视频推荐业务","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多目标建模方向","attrs":{}},{"type":"text","text":"尝试和实践的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多种方案","attrs":{}},{"type":"text","text":",最后是简单的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"总结","attrs":{}},{"type":"text","text":"
和在多目标建模方向的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"规划","attrs":{}},{"type":"text","text":"。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"01 背景","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在爱奇艺短视频推荐业务中,主要","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"流量形态","attrs":{}},{"type":"text","text":"由","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"两个部分组成:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(1) 爱奇艺APP ","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"底Tab的随刻视频","attrs":{}},{"type":"text","text":"以及","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"顶导航的热点模块","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(2) 爱奇艺","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"随刻APP 
首页","attrs":{}},{"type":"text","text":"短视频流推荐页面","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/f3/f35b005dcb5f1da0475a2a93ba12fa49.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图1:短视频推荐页面","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"用户在","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"feed流页面的行为","attrs":{}},{"type":"text","text":"分为:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"显式反馈:","attrs":{}},{"type":"text","text":"点击播放,点击up主头像、关注、点击/发布评论、收藏、点击圈子、分享等正向互动行为,点击不喜欢、举报等负向行为。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"隐式反馈","attrs":{}},{"type":"text","text":":播放时长、完成率、用户快速划过等行为。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"起初排序模型是以","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"点击+时长","attrs":{}},{"type":"text","text":"的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多目标模型","attrs":{}},{
"type":"text","text":",随着业务发展和模型迭代,我们需要","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"兼顾用户评论、点赞等强互动行为","attrs":{}},{"type":"text","text":"的生态收益,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"减少用户短停等负向内容","attrs":{}},{"type":"text","text":"的推荐。因此,我们在推荐系统多目标建模方向进行了一系列的尝试和实践,并在短视频推荐业务完成了技术落地,实现了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"人均播放时长提升7%+、互动提升20%+","attrs":{}},{"type":"text","text":"等各项指标的正向收益。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"02 多目标在短视频推荐业务中的实践","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":3},"content":[{"type":"text","text":"1.融合时长权重的点击率预估模型","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在基于","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"ctr预估","attrs":{}},{"type":"text","text":"的视频推荐中,普遍采用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"YouTube的权重策略","attrs":{}},{"type":"text","text":":","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"将正样本的播放时长作为样本权重,用加权的逻辑回归训练分类任务。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"该策略会造成","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"长视频的权重较高","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型偏向推出长视频。","attrs":{}},{"type":"text","text":"综合来看,无论将播放时长还是完播率作为样本权重,都会导致模型对长短视频有所偏重。","attrs":{}}]},{"type"
:"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"因此,权重设计方案应","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"确定合理的假设","attrs":{}},{"type":"text","text":":","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"视频推出质量与视频长度无关,且在视频时长的各区间下应近似均匀分布。","attrs":{}},{"type":"text","text":"即在任何区间下,样本权重的均值大概相同。则有:","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/f4/f4dc8105fd0b49f2867a76c2173cbc99.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"采用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"等频分桶","attrs":{}},{"type":"text","text":"的方式,对一定时间窗口内的播放样本按照","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"duration(视频时长)","attrs":{}},{"type":"text","text":"排序分散到100个桶,确保同一桶中视频观看数相同。进一步地对每个duration桶按照playtime(播放时长)排序再次等频分散到100个桶,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"并将权重归一化到[0,99]的区间整数。","attrs":{}},{"type":"text","text":"因此对所有样本,均可按照(duration,playtime)确定固定的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"分桶坐标","attrs":{}},{"type":"text","text":"和","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"权值","attrs":{}},{"type":"text","text":"。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/6d/6d3f8580a2cf075a1ad810142f676b31.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}]
,"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图2:对视频时长和播放时长进行分桶","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在确定整体的权重计算框架后,进一步对playtime较高的样本权重进行整体提升。预期","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"优化消费时长的指标,同时控制长视频的偏向。","attrs":{}},{"type":"text","text":"具体的boosting方案:","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/36/36beed721916c5c61c24b34940753ed6.png","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"其中,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"Am是上界值,shift是下界值,offset是时长偏移量,slope是斜率。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"为了完善视频生态,保证新老视频的权重具有一定的区分度。我们融合了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"视频年龄","attrs":{}},{"type":"text","text":"(用户行为时间-视频发布时间)对样本降权","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"(年龄越大,权重越低)","attrs":{}},{"type":"text","text":"。同时,为了能够使权重配置及时拟合整体用户最近的消费习惯,在保证任务产出效率的基础上,分别对不同平台用户生成","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"特定权重配置","attrs":{}},{"type":"text","text":",实现了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"周期性更新","attrs":{}},{"type":"text
","text":"。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"线上收益:人均播放时长提升3%,UCTR提升0.2%","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"这种方案的优缺点:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"优点:","attrs":{}},{"type":"text","text":"融合样本分布信息,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"拟合近期消费习惯","attrs":{}},{"type":"text","text":"。模型调节简单,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"可快速上线迭代。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"缺点:","attrs":{}},{"type":"text","text":"将时长转为样本权重","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"影响训练loss","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"本质并非对多目标建模","attrs":{}},{"type":"text","text":",而是将不同目标的信息转移到统一的目标上优化。而且时长信息利用不够充分,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"收益有限。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":3},"content":[{"type":"text","text":"2.多模型融合","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/76/76834111a2c07a44c8fc48431a442d3f.jpeg","alt":null,"t
itle":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图3:多模型融合","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多模型融合是指分别对每个目标训练一个模型,各预估得分根据目标重要性、业务指标需求等策略相加/相乘后进行融合排序。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在这里,我们分别训练纯点击的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"二分类模型","attrs":{}},{"type":"text","text":"以及","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"观看时长预估的回归模型","attrs":{}},{"type":"text","text":"。在离线调节融合参数时,采用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"grid 
search","attrs":{}},{"type":"text","text":"的方式选择更好的组合值。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"这种方案的优缺点:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"优点","attrs":{}},{"type":"text","text":":模型单独训练,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"只需要让单个模型达到“最好”,不需要考虑其它目标。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"缺点:","attrs":{}},{"type":"text","text":"多个目标重要性难以估算,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"组合困难","attrs":{}},{"type":"text","text":";考虑到数据集分布和模型训练的稳定性变化,需要","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"评估模型更新和组合参数的更新时机","attrs":{}},{"type":"text","text":";在线服务","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"计算量大","attrs":{}},{"type":"text","text":",请求时长取决于较复杂的模型且","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"资源消耗巨大","attrs":{}},{"type":"text","text":";如果增加的新目标数据比较稀疏,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"难以进行有效的模型训练和迭代。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":3},"content":[{"type":"text","text":"3.多任务学习-网络优化","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"随着爱奇艺随刻App朝着","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}
}],"text":"社区化","attrs":{}},{"type":"text","text":"的方向建设,要求feed流推荐效果在保证用户","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"观看时长、观看视频数、点击率","attrs":{}},{"type":"text","text":"等基础指标稳定的情况下,引导用户评论、点赞等互动。基于业务现状和之前的迭代基础,我们在","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多任务学习","attrs":{}},{"type":"text","text":"上进行了一系列探索和实践。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在深度学习领域,多任务学习通常","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"共享底层表示","attrs":{}},{"type":"text","text":",将多个任务放在一起学习,通过浅层的共享促进","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"相互学习","attrs":{}},{"type":"text","text":"。同时,由于","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"反向传播优化联合Loss","attrs":{}},{"type":"text","text":",会兼顾","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多任务间的约束关系","attrs":{}},{"type":"text","text":",因此能够有效","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"防止过拟合。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"目前工业界主要有","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"两种方法","attrs":{}},{"type":"text","text":"对多任务进行建模:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"(1)任务序列依赖关系建模;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type"
:"text","marks":[{"type":"strong","attrs":{}}],"text":"(2)优化底层共享表示。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":4},"content":[{"type":"text","text":"3.1 任务序列依赖关系建模","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/9a/9afb86d28a88ef83cf66b80d3737d01d.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图4:基于ESMM的方案","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"推荐场景中,用户的行为通常具有","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"序列依赖关系","attrs":{}},{"type":"text","text":",在阿里ESMM的文章[1]中,用户的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"转化行为是发生在用户点击之后","attrs":{}},{"type":"text","text":",因此基于序列依赖进行建模。如图4所示,对比feed流场景,点击是时长或者互动的前提,可以把","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"点击&时长,或者点击&互动作为ESMM迭代的方向。","attrs":{}},{"type":"text","text":"实现上,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"互动作为主任务,点击作为辅助任务,时长作为二者的正例权重,离线训练时两者loss直接相加。","attrs":{}},{"type":"text","text":"我们曾经尝试过对两个目标预估值进行变化以及时长更多的Label制定方式,但线上效果均持平微正。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"小结:点击和互动没有","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"绝对的联系","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],
"text":"点击&时长&互动,不适合ESMM应用场景;","attrs":{}},{"type":"text","text":"互动行为非常稀疏,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"训练效果较差;","attrs":{}},{"type":"text","text":"多个目标的loss直接相加,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"难以平衡对每个目标任务的影响","attrs":{}},{"type":"text","text":",对模型训练造成扰动;不同目标可能","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"差异较大,难以共享底层表示。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":4},"content":[{"type":"text","text":"3.2 MMOE+帕累托优化","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"我们分别对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"观看时长","attrs":{}},{"type":"text","text":"和评论数","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"Top 100","attrs":{}},{"type":"text","text":"的视频进行对比分析,发现","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"重合度较低、排序差异很大,强制底层共享存在冲突。","attrs":{}},{"type":"text","text":"因此,我们采用了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"谷歌MMOE","attrs":{}},{"type":"text","text":"[2][3]的方案,但是考虑到联合Loss需要进行","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"大量超参调节","attrs":{}},{"type":"text","text":",可能出现","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"目标一涨一跌","attrs":{}},{"type":"text","text":"的现象,因此使用帕累托优化保证原有目标效果不降低的情况下,提升互动效果。","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/52/5278b51fb3a093c7fb4c77f332f80383.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size"
,"attrs":{"size":10}}],"text":"图5 MMOE模型结构","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"MMOE模型底层通过采用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"Soft parameter sharing","attrs":{}},{"type":"text","text":"方式,能够有效解决","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"两个任务相关性较差情况下的多任务学习。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/b4/b48bc67948eb261a2d2fadce3ec4c79c.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图6 基于MMOE+帕累托优化的方案","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"帕累托优化","attrs":{}},{"type":"text","text":"主要参考阿里2019年发表于RecSys上的一篇文章[4],对比手动调节联合Loss,该论文使用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"kkt条件来负责各目标权重的生成","attrs":{}},{"type":"text","text":"。大体步骤(如图中Training虚线框内所示):","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(1) 
","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"均匀设置","attrs":{}},{"type":"text","text":"目标权重值(可更新的),同时","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"设置权重边界值超参","attrs":{}},{"type":"text","text":",运行","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"PE-LTR算法","attrs":{}},{"type":"text","text":"在训练过程中不断更新权重值;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(2) 通过设置","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"不同的权重边界值超参","attrs":{}},{"type":"text","text":",多次运行训练任务,根据","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"目标的重要性","attrs":{}},{"type":"text","text":"挑选效果最好的模型。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"线上收益:互动率提升20%,人均播放时长提升1.4%。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"小结:实际使用中","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"权重边界值对模型效果影响较大","attrs":{}},{"type":"text","text":",需要多次调优确定;多目标权重在前期已基本收敛,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"中后期浮动较小","attrs":{}},{"type":"text","text":";此","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"帕累托优化方案应用于离线训练","attrs":{}},{"type":"text","text":",在线服务部分仍需要其它策略。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":3},"content":[{"type":"text","text":"4.多任务学习-融合优化","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"par
agraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"除了对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"网络结构","attrs":{}},{"type":"text","text":"进行优化,我们对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型推理阶段的多目标输出组合进行了优化","attrs":{}},{"type":"text","text":",同时,加入了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"完播率","attrs":{}},{"type":"text","text":"和","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"时长目标","attrs":{}},{"type":"text","text":",模型Serving时,通过融合各预估分实现多目标的协调和折中处理,保证模型","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"对各个子目标的排序均有较好的效果。","attrs":{}},{"type":"text","text":"因此在进行多目标建模时,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"首先优化联合Loss","attrs":{}},{"type":"text","text":",保证各目标的离线效果均较优;","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"然后对各子目标进行融合排序","attrs":{}},{"type":"text","text":",实现多目标的权衡和整体提升。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":4},"content":[{"type":"text","text":"4.1 
乘法融合升级","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"在线推理","attrs":{}},{"type":"text","text":"时,使用可适配多种融合方案的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"超参配置","attrs":{}},{"type":"text","text":"。在多目标融合初期,我们采用了加权和的方式。由于最终的排序得分对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"各子目标的得分值域","attrs":{}},{"type":"text","text":"很敏感,因此我们增加α和β两个超参,来联合调节各子目标得分的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"灵敏度与提升比例。","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/42/425e18c5850201301447dcf99e044a5a.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"其中,αi:","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"超参,灵敏度","attrs":{}},{"type":"text","text":";scorei: 
","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型i的输出","attrs":{}},{"type":"text","text":";βi:","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"超参,提升比例,非线性处理","attrs":{}},{"type":"text","text":";factor:","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"超参,组合权重","attrs":{}},{"type":"text","text":";n:","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型数量","attrs":{}},{"type":"text","text":"。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"在业务的目标较少时,通过","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"加法方式","attrs":{}},{"type":"text","text":"融合新增目标可以短期内","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"快速获得收益","attrs":{}},{"type":"text","text":"。但随着","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"目标逐渐增多时,加法的融合排序能力会逐渐受限","attrs":{}},{"type":"text","text":"。主要包括:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(1)对于","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"新增目标","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"乘法融合具有一定的目标独立性","attrs":{}},{"type":"text","text":",无需考虑旧目标集的值域分布;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(2)随着目标逐渐增多,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"加法融合会逐步弱化各子目标的重要性影响。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"
type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"因此我们对多目标的融合方式升级为乘法:","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/f7/f7d67389810014fc89a43a10e649d42f.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"线上收益:CTR提升1.5%,人均播放时长提升1%。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":4},"content":[{"type":"text","text":"4.2任务序列依赖关系建模","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"为了提升短视频的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"播放渗透","attrs":{}},{"type":"text","text":",促使用户","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"深度消费","attrs":{}},{"type":"text","text":",我们新构造了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"三个目标:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(1)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"通过限定完播率阈值构造完播二分类目标","attrs":{}},{"type":"text","text":",以近似满足逻辑回归的假设条件;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(2)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"拟合平滑后的播放时长作为回归目标;","attrs":{}}]}
,{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(3)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"限定播放时长阈值","attrs":{}},{"type":"text","text":",构建有效播放的二分类目标。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"对于","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"回归目标","attrs":{}},{"type":"text","text":",采用","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"正逆序对比(PNR,positive-negative ratio)","attrs":{}},{"type":"text","text":"来评估多目标预估值融合后的排序效果。最终在随刻首页feed流和爱奇艺沉浸式场景中均取得","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"播放量和人均时长的显著提升。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"线上收益:UCTR提升1%,CTR提升3%,人均播放时长提升0.6%。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":4},"content":[{"type":"text","text":"4.3 PSO[5]进化优化算法","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"无论对预估分使用加法还是乘法方式融合,模型Serving时的超参均是通过","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"Grid 
Search","attrs":{}},{"type":"text","text":"得到离线较优的几组解。需要","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"离线搜参","attrs":{}},{"type":"text","text":"以及","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"线上AB","attrs":{}},{"type":"text","text":"才能最终确定,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"效率较低","attrs":{}},{"type":"text","text":"。随着模型的迭代和样本分布的改变,最优解也在变。因此我们借鉴了多目标进化优化算法的思路,基于","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"启发式的粒子群算法(PSO,Particle Swarm Optimization)","attrs":{}},{"type":"text","text":"搜索融合参数,逼近","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多目标的Pareto前沿","attrs":{}},{"type":"text","text":"。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"PSO算法通过初始化一群随机粒子,启发式地多次迭代求出最优解。每一次迭代,粒子通过","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"个体极值(该粒子所经过的最优解)和群体极值(种群找到的最优解)","attrs":{}},{"type":"text","text":"来更新各自位置。","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"最终所有粒子会兼顾个体的历史最优和群体共享的全局最优直至收敛。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"基于PSO算法进行","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"多目标搜参","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"首先初始化参数","attrs":{}},{"type":"text","text":";通过","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"乘法融合","attrs":{}},{"type":"text","text":"得到每个视频最终的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"排序分","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks"
:[{"type":"strong","attrs":{}}],"text":"并计算各子目标的AUC","attrs":{}},{"type":"text","text":";根据指标的重要性对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"完播率分类的AUC、播放时长的PNR等确定权重","attrs":{}},{"type":"text","text":",定义","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"总的优化目标:","attrs":{}}]},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/a0/a0ac3061fc833323fe38873d36e36f83.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"最后通过","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"持续迭代","attrs":{}},{"type":"text","text":",使得","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"总评估目标Obj最大","attrs":{}},{"type":"text","text":",即得到","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"各子目标的超参数α、β","attrs":{}},{"type":"text","text":"。图7为总目标得分Obj随迭代步数的收敛曲线。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"image","attrs":{"src":"https://static001.geekbang.org/infoq/61/61d6c279f489e958965a8b1634ac158b.jpeg","alt":null,"title":null,"style":[{"key":"width","value":"75%"},{"key":"bordertype","value":"none"}],"href":null,"fromPaste":true,"pastePass":true}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":"center","origin":null},"content":[{"type":"text","marks":[{"type":"size","attrs":{"size":10}}],"text":"图7:总目标得分的收敛曲线","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"搜参任务需要保证","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}
],"text":"总目标的定义足够完美","attrs":{}},{"type":"text","text":",保证粒子的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"优化方向不至于被某个子目标带偏","attrs":{}},{"type":"text","text":",此外验证集的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"无偏性和一致性","attrs":{}},{"type":"text","text":"也是效果一致的重要保证。进一步地我们将PSO搜参过程","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"部署到集群","attrs":{}},{"type":"text","text":",","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"实现模型和融合参数的同步更新,大幅降低人工调参的成本。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"小结:无论融合方式的升级还是搜参方式的优化,均是","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"离线搜参后部署到线上生效。","attrs":{}},{"type":"text","text":"受","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"场景、运营流量","attrs":{}},{"type":"text","text":"等影响,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"离线指标和业务指标存在gap。","attrs":{}},{"type":"text","text":"离线寻参容易获得","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"短期收益","attrs":{}},{"type":"text","text":",但","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"无法动态调整","attrs":{}},{"type":"text","text":"及时适应样本分布的变化。后续结合用户的","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"实时日志、特征","attrs":{}},{"type":"text","text":"等,对","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"在线自动搜参","attrs":{}},{"type":"text","text":"展开持续探索;以及","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型化拟合参数","attrs":{}},{"type":"text","text":",尝试提升个性化和实时性。","attrs":{}}]},{"type":"heading","attrs":{"align":null,"level":2},"content":[{"type":"text","text":"03 
总结与展望","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"本文总结了","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"爱奇艺短视频推荐技术排序阶段多目标的优化","attrs":{}},{"type":"text","text":",从","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"样本权重优化","attrs":{}},{"type":"text","text":"到","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"模型结构、多目标融合","attrs":{}},{"type":"text","text":"等多角度进行了一系列的探索和实践,","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"在线上取得了一系列的收益","attrs":{}},{"type":"text","text":"。后续,我们将会从","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"3个方向继续探索:","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(1)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"跨场景的多目标学习","attrs":{}},{"type":"text","text":":结合多场景的数据学习用户兴趣,优化主/辅助任务,并应用到更多场景中;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(2)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"优化模型","attrs":{}},{"type":"text","text":":包括梯度优化、底层共享的设计、Loss设计、不同任务对梯度的影响等;","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"(3)","attrs":{}},{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"在线搜参","attrs":{}},{"type":"text","text":":开发自动调参框架,利用一部分流量进行探索,实时动态调整等。","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":
null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","marks":[{"type":"strong","attrs":{}}],"text":"参考文献","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null}},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[1] Ma X, Zhao L, Huang G, et al. Entire space multi-task model: An effective approach for estimating post-click conversion rate[C]//The 41st International ACM SIGIR Conference on Research & Development in Information Retrieval. 2018: 1137-1140.","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[2] Ma J, Zhao Z, Yi X, et al. Modeling task relationships in multi-task learning with multi-gate mixture-of-experts[C]//Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining. 2018: 1930-1939.","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[3] Zhao Z, Hong L, Wei L, et al. Recommending what video to watch next: a multitask ranking system[C]//Proceedings of the 13th ACM Conference on Recommender Systems. 2019: 43-51.","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[4] Lin X, Chen H, Pei C, et al. A pareto-efficient algorithm for multiple objective optimization in e-commerce recommendation[C]//Proceedings of the 13th ACM Conference on Recommender Systems. 2019: 20-28.","attrs":{}}]},{"type":"paragraph","attrs":{"indent":0,"number":0,"align":null,"origin":null},"content":[{"type":"text","text":"[5] Kennedy J, Eberhart R. Particle swarm optimization[C]//Proceedings of ICNN'95-international conference on neural networks. IEEE, 1995, 4: 1942-1948.","attrs":{}}]}]}
發表評論
所有評論
還沒有人評論,想成為第一個評論的人麼? 請在上方評論欄輸入並且點擊發布.
相關文章