[{"data":1,"prerenderedAt":387},["ShallowReactive",2],{"publication-2024\u002Fcard-semantic-segmentation-with-efficient-class-aware-regularized-decoder-en":3,"publication-members":74},{"_path":4,"_dir":5,"_draft":6,"_partial":6,"_locale":7,"title":8,"description":9,"_hidden":6,"authors":10,"authors_orcid":19,"year":28,"doi":29,"openalex_id":30,"venue":31,"abstract_screenshot":32,"keywords":33,"body":43,"_type":67,"_id":68,"_source":69,"_file":70,"_stem":71,"_extension":72,"locale":73},"\u002Fpublications\u002F2024\u002Fcard-semantic-segmentation-with-efficient-class-aware-regularized-decoder","2024",false,"","CARD: Semantic Segmentation With Efficient Class-Aware Regularized Decoder","Semantic segmentation has recently achieved notable advances by exploiting “class-level” contextual information during learning, e.g., the Object Contextual Representation (OCR) and Context Prior (CPNet) approaches. However, these approaches simply concatenate class-level information to pixel features to boost pixel representation learning, which cannot fully utilize intra-class and inter-class contextual information. Moreover, these approaches learn soft class centers based on coarse mask prediction, which is prone to error accumulation. To better exploit class-level information, we propose a universal Class-Aware Regularization (CAR) approach to optimize the intra-class variance and inter-class distance during feature learning, motivated by the fact that humans can recognize an object by itself no matter which other objects it appears with. Moreover, we design a dedicated decoder for CAR (named CARD), which consists of a novel spatial token mixer and an upsampling module, to maximize its gain for existing baselines while being highly efficient in terms of computational cost. Specifically, CAR consists of three novel loss functions. The first loss function encourages more compact class representations within each class, the second directly maximizes the distance between different class centers, and the third further pushes the distance between inter-class centers and pixels. Furthermore, the class center in our approach is directly generated from ground truth instead of from the error-prone coarse prediction. CAR can be directly applied to most existing segmentation models during training, including OCR and CPNet, and can largely improve their accuracy at no additional inference overhead. Extensive experiments and ablation studies conducted on multiple benchmark datasets demonstrate that the proposed CAR can boost the accuracy of all baseline models by up to 2.23% mIOU with superior generalization ability. CARD outperforms state-of-the-art approaches on multiple benchmarks with a highly efficient architecture. The code will be available at https:\u002F\u002Fgithub.com\u002Fedwardyehuang\u002FCAR.",[11,12,13,14,15,16,17,18],"Huang, Ye","Kang, Di","Chen, Liang","Jia, Wenjing","He, Xiangjian","Duan, Lixin","Zhe, Xuefei","Bao, Linchao",[20,21,22,23,24,25,26,27],"0000-0001-5668-5529","0000-0002-8996-0897","0000-0003-0712-4738","0000-0002-0940-3338","0000-0001-8962-540X","0000-0002-0723-4016","0000-0002-5005-7166","0000-0001-9543-3754",2024,"https:\u002F\u002Fdoi.org\u002F10.1109\u002Ftcsvt.2024.3395132","W4396214386","IEEE Transactions on Circuits and Systems for Video Technology",null,[34,35,36,37,38,39,40,41,42],"Computer science","Class (philosophy)","Segmentation","Artificial intelligence","Natural language processing","Semantics (computer science)","Image segmentation","Pattern recognition (psychology)","Programming language",{"type":44,"children":45,"toc":64},"root",[46],{"type":47,"tag":48,"props":49,"children":50},"element","p",{},[51,54,62],{"type":52,"value":53},"text","Semantic segmentation has recently achieved notable advances by exploiting “class-level” contextual information during learning, e.g., the Object Contextual Representation (OCR) and Context Prior (CPNet) approaches. However, these approaches simply concatenate class-level information to pixel features to boost pixel representation learning, which cannot fully utilize intra-class and inter-class contextual information. Moreover, these approaches learn soft class centers based on coarse mask prediction, which is prone to error accumulation. To better exploit class-level information, we propose a universal Class-Aware Regularization (CAR) approach to optimize the intra-class variance and inter-class distance during feature learning, motivated by the fact that humans can recognize an object by itself no matter which other objects it appears with. Moreover, we design a dedicated decoder for CAR (named CARD), which consists of a novel spatial token mixer and an upsampling module, to maximize its gain for existing baselines while being highly efficient in terms of computational cost. Specifically, CAR consists of three novel loss functions. The first loss function encourages more compact class representations within each class, the second directly maximizes the distance between different class centers, and the third further pushes the distance between inter-class centers and pixels. Furthermore, the class center in our approach is directly generated from ground truth instead of from the error-prone coarse prediction. CAR can be directly applied to most existing segmentation models during training, including OCR and CPNet, and can largely improve their accuracy at no additional inference overhead. Extensive experiments and ablation studies conducted on multiple benchmark datasets demonstrate that the proposed CAR can boost the accuracy of all baseline models by up to 2.23% mIOU with superior generalization ability. CARD outperforms state-of-the-art approaches on multiple benchmarks with a highly efficient architecture. The code will be available at ",{"type":47,"tag":55,"props":56,"children":60},"a",{"href":57,"rel":58},"https:\u002F\u002Fgithub.com\u002Fedwardyehuang\u002FCAR",[59],"nofollow",[61],{"type":52,"value":57},{"type":52,"value":63},".",{"title":7,"searchDepth":65,"depth":65,"links":66},2,[],"markdown","content:publications:2024:card-semantic-segmentation-with-efficient-class-aware-regularized-decoder.md","content","publications\u002F2024\u002Fcard-semantic-segmentation-with-efficient-class-aware-regularized-decoder.md","publications\u002F2024\u002Fcard-semantic-segmentation-with-efficient-class-aware-regularized-decoder","md","en",[75,88,93,104,111,119,125,134,141,147,152,162,169,178,184,196,205,214,220,228,233,241,247,255,259,269,276,284,289,298,304,312,318,326,331,337,347,355,361,369,374,382],{"_path":76,"title":77,"name":78,"role":79,"email":32,"image":80,"category":81,"interests":82,"order":65,"_id":87},"\u002Fmembers\u002Fstaff\u002Falain-chong","Vice President for Global Affairs and Partnerships · Professor of Information Systems and Digital Innovation","Alain Chong","Deputy Director of Lab","assets\u002F8.png","staff",[83,84,85,86],"信息系统与运作管理","计算机科学与运筹学","Information Systems and Operations Management","Computer Science and Operations Research","content:members:staff:alain-chong.md",{"_path":76,"title":89,"role":90,"interests":91,"_id":92},"全球事务与合作副校长 · 信息系统与数字创新教授","实验室副主任",[83,84],"content:members:staff:alain-chong.zh-CN.md",{"_path":94,"title":95,"name":96,"role":97,"email":32,"image":98,"category":81,"interests":99,"order":102,"_id":103},"\u002Fmembers\u002Fstaff\u002Fanthony-belloti","Professor","Anthony Belloti","Core Member","assets\u002F41.png",[100,101],"Machine Learning and Credit Risk Model","Model Risks",9,"content:members:staff:anthony-belloti.md",{"_path":94,"title":105,"role":106,"interests":107,"_id":110},"计算机科学系教授","核心成员",[108,109],"机器学习与信用风险模型","模型风险","content:members:staff:anthony-belloti.zh-CN.md",{"_path":112,"title":113,"name":113,"role":97,"email":32,"image":114,"category":81,"interests":115,"order":117,"_id":118},"\u002Fmembers\u002Fstaff\u002Fboon-giin-lee","Boon Giin Lee","assets\u002F31.jpg",[116],"Intelligent Sensor and Extended Reality",11,"content:members:staff:boon-giin-lee.md",{"_path":112,"title":120,"role":106,"interests":121,"_id":124},"人机交互实验室负责人 · 计算机科学系副教授",[122,123],"人机交互 HCI","智能传感与扩展现实技术","content:members:staff:boon-giin-lee.zh-CN.md",{"_path":126,"title":127,"name":127,"role":128,"email":32,"image":129,"category":81,"interests":130,"order":132,"_id":133},"\u002Fmembers\u002Fstaff\u002Fcong-cao","Cong Cao","Direction Leader","assets\u002FCC.png",[131],"Science and technology policy and institutional reform",7,"content:members:staff:cong-cao.md",{"_path":126,"title":135,"name":136,"role":137,"interests":138,"_id":140},"宁波诺丁汉大学商学院创新学教授","曹聪","方向带头人",[139],"科技政策与体制改革","content:members:staff:cong-cao.zh-CN.md",{"_path":142,"title":143,"name":143,"role":97,"email":32,"image":144,"category":81,"order":145,"_id":146},"\u002Fmembers\u002Fstaff\u002Fdave-towey","Dave Towey","assets\u002F32.jpg",8,"content:members:staff:dave-towey.md",{"_path":142,"title":148,"role":106,"interests":149,"_id":151},"计算机科学系教授 · 计算机科学系主任",[150],"计算机科学与语言学","content:members:staff:dave-towey.zh-CN.md",{"_path":153,"title":154,"name":154,"role":97,"email":32,"image":155,"category":81,"interests":156,"order":160,"_id":161},"\u002Fmembers\u002Fstaff\u002Ffazl-ullah-khan","Fazl Ullah Khan","assets\u002F44.png",[157,158,159],"Computer Network","Computer Architecture and Network Security","Software Engineering",12,"content:members:staff:fazl-ullah-khan.md",{"_path":153,"title":163,"role":106,"interests":164,"_id":168},"计算机科学系助理教授 · IEEE 高级会员",[165,166,167],"计算机网络","计算机和网络安全","软件工程","content:members:staff:fazl-ullah-khan.zh-CN.md",{"_path":170,"title":171,"name":172,"role":97,"email":32,"image":173,"category":81,"interests":174,"order":176,"_id":177},"\u002Fmembers\u002Fstaff\u002Fheng-yu","Associate Professor","Heng Yu","assets\u002FHENGYU.png",[175],"Embedded Systems Design",17,"content:members:staff:heng-yu.md",{"_path":170,"title":179,"name":180,"role":106,"interests":181,"_id":183},"计算机科学系副教授","于恒",[182],"嵌入式系统设计","content:members:staff:heng-yu.zh-CN.md",{"_path":185,"title":171,"name":186,"role":97,"email":32,"image":187,"category":81,"interests":188,"order":194,"_id":195},"\u002Fmembers\u002Fstaff\u002Fheshan-du","Heshan Du","assets\u002Fhesahndu.png",[189,190,191,192,193],"Logic, Knowledge Representation and Reasoning","Geographic Information Systems","Operations Research","Machine Learning","Reinforcement Learning",20,"content:members:staff:heshan-du.md",{"_path":185,"title":179,"name":197,"role":106,"interests":198,"_id":204},"杜何珊",[199,200,201,202,203],"逻辑与知识表示","地理信息系统","运筹学","机器学习","强化学习","content:members:staff:heshan-du.zh-CN.md",{"_path":206,"title":207,"name":208,"role":97,"email":32,"image":209,"category":81,"interests":210,"order":212,"_id":213},"\u002Fmembers\u002Fstaff\u002Fhuan-jin","Assistant Professor","Huan Jin","assets\u002Fhuanjin.png",[211,192],"Optimisation",21,"content:members:staff:huan-jin.md",{"_path":206,"title":215,"name":216,"role":106,"interests":217,"_id":219},"计算机科学系助理教授","靳欢",[218,202],"优化","content:members:staff:huan-jin.zh-CN.md",{"_path":221,"title":171,"name":222,"role":128,"email":32,"image":223,"category":81,"interests":224,"order":226,"_id":227},"\u002Fmembers\u002Fstaff\u002Fjianfeng-ren","Jianfeng Ren","assets\u002F42.jpg",[192,225],"Computer Vision",3,"content:members:staff:jianfeng-ren.md",{"_path":221,"title":179,"name":229,"role":137,"interests":230,"_id":232},"任剑锋",[202,231],"计算机视觉","content:members:staff:jianfeng-ren.zh-CN.md",{"_path":234,"title":235,"name":235,"role":128,"email":32,"image":236,"category":81,"interests":237,"order":239,"_id":240},"\u002Fmembers\u002Fstaff\u002Fjiawei-li","Jiawei Li","assets\u002F11.png",[238],"Computer Science and Artificial Intelligence",15,"content:members:staff:jiawei-li.md",{"_path":234,"title":242,"name":243,"role":137,"interests":244,"_id":246},"计算机科学系助理教授 · 英国诺丁汉大学博士后","李家炜",[245],"计算机与人工智能","content:members:staff:jiawei-li.zh-CN.md",{"_path":248,"title":171,"name":249,"role":97,"email":32,"image":250,"category":81,"interests":251,"order":253,"_id":254},"\u002Fmembers\u002Fstaff\u002Fmatthew-pike","Matthew Pike","assets\u002F43.jpg",[252],"Digitalised Learning",16,"content:members:staff:matthew-pike.md",{"_path":248,"title":179,"role":106,"interests":256,"_id":258},[257],"数字化学习","content:members:staff:matthew-pike.zh-CN.md",{"_path":260,"title":207,"name":261,"role":97,"email":32,"image":262,"category":81,"interests":263,"order":267,"_id":268},"\u002Fmembers\u002Fstaff\u002Fning-xue","Ning Xue","\u002Fimages\u002Fuon-logo.png",[264,265,266],"Artificial Intelligence","Computational Intelligence","Combinatorial Optimization",13,"content:members:staff:ning-xue.md",{"_path":260,"title":215,"name":270,"role":106,"interests":271,"_id":275},"薛宁",[272,273,274],"人工智能","计算智能","组合优化","content:members:staff:ning-xue.zh-CN.md",{"_path":277,"title":207,"name":278,"role":97,"email":32,"image":279,"category":81,"interests":280,"order":282,"_id":283},"\u002Fmembers\u002Fstaff\u002Fqian-zhang","Qian Zhang","assets\u002Fqz.png",[281,225,192],"Image Processing",14,"content:members:staff:qian-zhang.md",{"_path":277,"title":215,"name":285,"role":106,"interests":286,"_id":288},"张茜",[287,231,202],"图像处理","content:members:staff:qian-zhang.zh-CN.md",{"_path":290,"title":95,"name":291,"role":292,"email":32,"image":293,"category":81,"interests":294,"orcid":295,"order":296,"_id":297},"\u002Fmembers\u002Fstaff\u002Fruibin-bai","Ruibin Bai","Director of Lab","assets\u002F38.png",[86],"0000-0003-1722-568X",1,"content:members:staff:ruibin-bai.md",{"_path":290,"title":299,"name":300,"role":301,"interests":302,"_id":303},"教授","白瑞斌","实验室主任",[84],"content:members:staff:ruibin-bai.zh-CN.md",{"_path":305,"title":306,"name":306,"role":128,"email":32,"image":307,"category":81,"interests":308,"order":310,"_id":311},"\u002Fmembers\u002Fstaff\u002Fsean-he","Sean He","assets\u002F39.png",[225,309,192],"Data Analytics",5,"content:members:staff:sean-he.md",{"_path":305,"title":313,"name":314,"role":137,"interests":315,"_id":317},"计算机科学系教授 · 国家级讲席学者","何祥健",[231,316,202],"数据分析","content:members:staff:sean-he.zh-CN.md",{"_path":319,"title":320,"name":320,"role":97,"email":32,"image":321,"category":81,"interests":322,"order":324,"_id":325},"\u002Fmembers\u002Fstaff\u002Ftianxiang-cui","Tianxiang Cui","assets\u002Ftianxiangcui.png",[265,323,192,193],"Operation Research",19,"content:members:staff:tianxiang-cui.md",{"_path":319,"title":163,"name":327,"role":106,"interests":328,"_id":330},"崔天翔",[273,329,202,203],"运筹研究","content:members:staff:tianxiang-cui.zh-CN.md",{"_path":332,"title":95,"name":333,"role":97,"email":32,"image":334,"category":81,"order":335,"_id":336},"\u002Fmembers\u002Fstaff\u002Fxiuping-hua","Xiuping Hua","assets\u002FxiupignHua.png",10,"content:members:staff:xiuping-hua.md",{"_path":332,"title":338,"name":339,"role":106,"interests":340,"_id":346},"金融、会计与经济系教授","华秀萍",[341,342,343,344,345,108],"资产定价","公司金融","衍生品","金融科技","创新金融和普惠金融","content:members:staff:xiuping-hua.zh-CN.md",{"_path":348,"title":95,"name":349,"role":97,"email":32,"image":350,"category":81,"interests":351,"order":353,"_id":354},"\u002Fmembers\u002Fstaff\u002Fying-weng","Ying Weng","assets\u002Fyingweng.png",[225,281,352],"IoT",4,"content:members:staff:ying-weng.md",{"_path":348,"title":105,"name":356,"role":106,"interests":357,"_id":360},"翁莹",[231,287,358,359],"物联网 IoT","无线网络安全与服务质量","content:members:staff:ying-weng.zh-CN.md",{"_path":362,"title":207,"name":363,"role":97,"email":32,"image":364,"category":81,"interests":365,"order":367,"_id":368},"\u002Fmembers\u002Fstaff\u002Fyuan-yao","Yuan Yao","assets\u002Fyuanyao.png",[366],"Autonomous Agents and Multi-Agent Systems",18,"content:members:staff:yuan-yao.md",{"_path":362,"title":215,"name":370,"role":106,"interests":371,"_id":373},"姚远",[372],"自主智能体与多智能体系统","content:members:staff:yuan-yao.zh-CN.md",{"_path":375,"title":207,"name":376,"role":128,"email":32,"image":377,"category":81,"interests":378,"order":380,"_id":381},"\u002Fmembers\u002Fstaff\u002Fzheng-lu","Zheng Lu","assets\u002F13.png",[379],"Computer Science",6,"content:members:staff:zheng-lu.md",{"_path":375,"title":215,"name":383,"role":137,"interests":384,"_id":386},"卢正",[385],"计算机科学","content:members:staff:zheng-lu.zh-CN.md",1782639595233]