{"id":793,"date":"2022-12-01T21:10:16","date_gmt":"2022-12-01T13:10:16","guid":{"rendered":"https:\/\/511cvlab.sinkers.cn\/?p=793"},"modified":"2025-10-17T17:06:41","modified_gmt":"2025-10-17T09:06:41","slug":"dsf","status":"publish","type":"post","link":"https:\/\/cv.nirc.top\/zh\/2022\/dsf\/","title":{"rendered":"A Dual-Branch Self-Boosting Framework for Self-Supervised 3D Hand Pose Estimation"},"content":{"rendered":"<div class=\"wp-block-group has-global-padding is-layout-constrained wp-container-core-group-is-layout-f00c8009 wp-block-group-is-layout-constrained\" style=\"padding-right:5%;padding-left:5%\">\n<div class=\"wp-block-group has-global-padding is-layout-constrained wp-block-group-is-layout-constrained\">\n    <div\n        class=\"wp-block-buttons is-content-justification-center is-layout-flex wp-container-core-buttons-is-layout-1 wp-block-buttons-is-layout-flex\">\n        <div class=\"wp-block-button\" style=\"line-height: 1.5;\">\n            <a class=\"wp-block-button__link wp-element-button\"\n                href=\"https:\/\/ieeexplore.ieee.org\/abstract\/document\/9841448\/\" target=\"_blank\"\n                style=\"padding-right: var(--wp--preset--spacing--40); padding-left: var(--wp--preset--spacing--40); display: flex; align-items: center; gap: 8px;\">\n                <div>\n                    <svg class=\"svg-inline--fa fa-file-pdf fa-w-12\" aria-hidden=\"true\" focusable=\"false\"\n                        data-prefix=\"fas\" data-icon=\"file-pdf\" role=\"img\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\"\n                        viewbox=\"0 0 384 512\" style=\"height: 1em; width: 1em;\">\n                        <path fill=\"#FFFFFF\"\n                            d=\"M181.9 256.1c-5-16-4.9-46.9-2-46.9 8.4 0 7.6 36.9 2 46.9zm-1.7 47.2c-7.7 20.2-17.3 43.3-28.4 62.7 18.3-7 39-17.2 62.9-21.9-12.7-9.6-24.9-23.4-34.5-40.8zM86.1 428.1c0 .8 13.2-5.4 34.9-40.2-6.7 6.3-29.1 24.5-34.9 40.2zM248 160h136v328c0 13.3-10.7 24-24 24H24c-13.3 
0-24-10.7-24-24V24C0 10.7 10.7 0 24 0h200v136c0 13.2 10.8 24 24 24zm-8 171.8c-20-12.2-33.3-29-42.7-53.8 4.5-18.5 11.6-46.6 6.2-64.2-4.7-29.4-42.4-26.5-47.8-6.8-5 18.3-.4 44.1 8.1 77-11.6 27.6-28.7 64.6-40.8 85.8-.1 0-.1.1-.2.1-27.1 13.9-73.6 44.5-54.5 68 5.6 6.9 16 10 21.5 10 17.9 0 35.7-18 61.1-61.8 25.8-8.5 54.1-19.1 79-23.2 21.7 11.8 47.1 19.5 64 19.5 29.2 0 31.2-32 19.7-43.4-13.9-13.6-54.3-9.7-73.6-7.2zM377 105L279 7c-4.5-4.5-10.6-7-17-7h-6v128h128v-6.1c0-6.3-2.5-12.4-7-16.9zm-74.1 255.3c4.1-2.7-2.5-11.9-42.8-9 37.1 15.8 42.8 9 42.8 9z\">\n                        <\/path>\n                    <\/svg>\n                <\/div>\n                <div>Paper<\/div>\n            <\/a>\n        <\/div>\n\n        <div class=\"wp-block-button\" style=\"line-height: 1.5;\">\n            <a class=\"wp-block-button__link wp-element-button\" href=\"https:\/\/github.com\/PengfeiRen96\/DSF\" target=\"_blank\"\n                style=\"padding-right: var(--wp--preset--spacing--40); padding-left: var(--wp--preset--spacing--40); display: flex; align-items: center; gap: 8px;\">\n                <div>\n                    <svg class=\"svg-inline--fa fa-github fa-w-16\" aria-hidden=\"true\" focusable=\"false\" data-prefix=\"fab\"\n                        data-icon=\"github\" role=\"img\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" viewbox=\"0 0 496 512\" data-fa-i2svg=\"\"\n                        style=\"height: 1em; width: 1em;\">\n                        <path fill=\"#FFFFFF\"\n                            d=\"M165.9 397.4c0 2-2.3 3.6-5.2 3.6-3.3.3-5.6-1.3-5.6-3.6 0-2 2.3-3.6 5.2-3.6 3-.3 5.6 1.3 5.6 3.6zm-31.1-4.5c-.7 2 1.3 4.3 4.3 4.9 2.6 1 5.6 0 6.2-2s-1.3-4.3-4.3-5.2c-2.6-.7-5.5.3-6.2 2.3zm44.2-1.7c-2.9.7-4.9 2.6-4.6 4.9.3 2 2.9 3.3 5.9 2.6 2.9-.7 4.9-2.6 4.6-4.6-.3-1.9-3-3.2-5.9-2.9zM244.8 8C106.1 8 0 113.3 0 252c0 110.9 69.8 205.8 169.5 239.2 12.8 2.3 17.3-5.6 17.3-12.1 0-6.2-.3-40.4-.3-61.4 0 0-70 15-84.7-29.8 0 0-11.4-29.1-27.8-36.6 0 0-22.9-15.7 1.6-15.4 0 0 24.9 2 38.6 25.8 
21.9 38.6 58.6 27.5 72.9 20.9 2.3-16 8.8-27.1 16-33.7-55.9-6.2-112.3-14.3-112.3-110.5 0-27.5 7.6-41.3 23.6-58.9-2.6-6.5-11.1-33.3 2.6-67.9 20.9-6.5 69 27 69 27 20-5.6 41.5-8.5 62.8-8.5s42.8 2.9 62.8 8.5c0 0 48.1-33.6 69-27 13.7 34.7 5.2 61.4 2.6 67.9 16 17.7 25.8 31.5 25.8 58.9 0 96.5-58.9 104.2-114.8 110.5 9.2 7.9 17 22.9 17 46.4 0 33.7-.3 75.4-.3 83.6 0 6.5 4.6 14.4 17.3 12.1C428.2 457.8 496 362.9 496 252 496 113.3 383.5 8 244.8 8zM97.2 352.9c-1.3 1-1 3.3.7 5.2 1.6 1.6 3.9 2.3 5.2 1 1.3-1 1-3.3-.7-5.2-1.6-1.6-3.9-2.3-5.2-1zm-10.8-8.1c-.7 1.3.3 2.9 2.3 3.9 1.6 1 3.6.7 4.3-.7.7-1.3-.3-2.9-2.3-3.9-2-.6-3.6-.3-4.3.7zm32.4 35.6c-1.6 1.3-1 4.3 1.3 6.2 2.3 2.3 5.2 2.6 6.5 1 1.3-1.3.7-4.3-1.3-6.2-2.2-2.3-5.2-2.6-6.5-1zm-11.4-14.7c-1.6 1-1.6 3.6 0 5.9 1.6 2.3 4.3 3.3 5.6 2.3 1.6-1.3 1.6-3.9 0-6.2-1.4-2.3-4-3.3-5.6-2z\">\n                        <\/path>\n                    <\/svg>\n                <\/div>\n                <div>Code<\/div>\n            <\/a>\n        <\/div>\n\n\n    <\/div>\n<\/div>\n\n\n\n<div class=\"wp-block-group alignwide is-content-justification-center is-nowrap is-layout-flex wp-container-core-group-is-layout-23441af8 wp-block-group-is-layout-flex\">\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd60652c5&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd60652c5\" class=\"wp-block-image aligncenter size-large wp-lightbox-container\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/DSF-ICVL.gif\" alt=\"\" 
style=\"object-fit:cover\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">ICVL Dataset<\/figcaption><\/figure>\n\n\n\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd60658f5&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd60658f5\" class=\"wp-block-image aligncenter size-large wp-lightbox-container\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/ezgif-31a96619f405b1.gif\" alt=\"\" style=\"object-fit:cover\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" 
d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">MSRA Dataset<\/figcaption><\/figure>\n<\/div>\n\n\n\n<p class=\"has-text-align-center has-x-small-font-size\">For ICVL and MSRA, we show that DSF is able to generate more reasonable hand poses than annotations. <br>We use red circles to locate errors in annotations.<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">Overview<\/h2>\n\n\n\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd6067286&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd6067286\" class=\"wp-block-image size-full wp-lightbox-container\"><img loading=\"lazy\" decoding=\"async\" width=\"2869\" height=\"1192\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/511cvlab.sinkers.cn\/wp-content\/uploads\/2024\/12\/image-7.png\" alt=\"\" class=\"wp-image-794\" srcset=\"https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7.png 2869w, https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7-300x125.png 300w, https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7-1024x425.png 1024w, https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7-768x319.png 768w, https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7-1536x638.png 1536w, https:\/\/cv.nirc.top\/wp-content\/uploads\/2024\/12\/image-7-2048x851.png 2048w\" sizes=\"auto, (max-width: 2869px) 100vw, 2869px\" 
\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">Overview of our proposed dual-branch self-boosting framework (DSF).<\/figcaption><\/figure>\n\n\n\n<p class=\"text-justify\">Through image-to-image translation technology, our framework can make better use of synthetic data for pre-training. 
The dual-branch design allows our framework to adopt a part-aware model-fitting loss for self-supervised learning on unlabeled real data while achieving high-accuracy pose estimation and flexible and robust hand model estimation simultaneously.<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">Qualitative Results<\/h2>\n\n\n\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd6067b1b&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd6067b1b\" class=\"wp-block-image size-large wp-lightbox-container\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/DSF-WechatIMG77.jpg\" alt=\"\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">Qualitative results for NYU dataset.<\/figcaption><\/figure>\n\n\n\n<p class=\"text-justify\">\u2705 DSF can maintain the rationality of hand pose when <strong>fingers contact intensively<\/strong>, such as <strong>clenching <\/strong>(3361) or when <strong>fingers are pressed 
together<\/strong> (3993).<\/p>\n\n\n\n<p class=\"text-justify\">\u2705 DSF is robust to <strong>extreme perspective<\/strong> (609, 4606) and the <strong>depth holes<\/strong> (1194, 4329). Although DSF\u2019s predictions in missing regions are not completely consistent with the ground truth, they remain <strong>structurally reasonable<\/strong>.<\/p>\n\n\n\n<p class=\"text-justify\">\u2705 DSF can predict <strong>complex hand poses<\/strong> (5027, 7122, 6817) with high accuracy.<\/p>\n\n\n\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd6067fb9&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd6067fb9\" class=\"wp-block-image size-large wp-lightbox-container\" style=\"margin-top:var(--wp--preset--spacing--50)\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/SDF-WechatIMG72.jpg\" alt=\"\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">Qualitative results for testing in real scenarios on different 
subjects with different hand sizes and hand poses. For each subject, the first line is the depth images captured by the KinectV2; the second line is the cropped hand depth images and the estimated hand pose; the third line is the estimated hand mesh.<\/figcaption><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">Comparison to SOTA<\/h2>\n\n\n\n<figure data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd6068391&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd6068391\" class=\"wp-block-image aligncenter size-large is-resized wp-lightbox-container\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/DSF-WechatIMG75.jpg\" alt=\"\" style=\"width:500px;height:auto\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">Comparison of the aje (mm) with state-of-the-art methods on NYU dataset.<\/figcaption><\/figure>\n\n\n\n<h2 class=\"wp-block-heading\">Downstream task: Skeleton-based Action Recognition<\/h2>\n\n\n\n<figure 
data-wp-context=\"{&quot;imageId&quot;:&quot;69f8bd60689f3&quot;}\" data-wp-interactive=\"core\/image\" data-wp-key=\"69f8bd60689f3\" class=\"wp-block-image aligncenter size-large is-resized wp-lightbox-container\"><img decoding=\"async\" data-wp-class--hide=\"state.isContentHidden\" data-wp-class--show=\"state.isContentVisible\" data-wp-init=\"callbacks.setButtonStyles\" data-wp-on--click=\"actions.showLightbox\" data-wp-on--load=\"callbacks.setButtonStyles\" data-wp-on-window--resize=\"callbacks.setButtonStyles\" src=\"https:\/\/sinkers-pic.oss-cn-beijing.aliyuncs.com\/img\/DSF-WechatIMG76.jpg\" alt=\"\" style=\"width:800px\"\/><button\n\t\t\tclass=\"lightbox-trigger\"\n\t\t\ttype=\"button\"\n\t\t\taria-haspopup=\"dialog\"\n\t\t\taria-label=\"\u653e\u5927\"\n\t\t\tdata-wp-init=\"callbacks.initTriggerButton\"\n\t\t\tdata-wp-on--click=\"actions.showLightbox\"\n\t\t\tdata-wp-style--right=\"state.imageButtonRight\"\n\t\t\tdata-wp-style--top=\"state.imageButtonTop\"\n\t\t>\n\t\t\t<svg xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"12\" height=\"12\" fill=\"none\" viewbox=\"0 0 12 12\">\n\t\t\t\t<path fill=\"#fff\" d=\"M2 0a2 2 0 0 0-2 2v2h1.5V2a.5.5 0 0 1 .5-.5h2V0H2Zm2 10.5H2a.5.5 0 0 1-.5-.5V8H0v2a2 2 0 0 0 2 2h2v-1.5ZM8 12v-1.5h2a.5.5 0 0 0 .5-.5V8H12v2a2 2 0 0 1-2 2H8Zm2-12a2 2 0 0 1 2 2v2h-1.5V2a.5.5 0 0 0-.5-.5H8V0h2Z\" \/>\n\t\t\t<\/svg>\n\t\t<\/button><figcaption class=\"wp-element-caption\">The comparison of the recognition accuracy (%) with the SOTA approaches on SHREC and DHG datasets. 
The upward arrows represent the improvement compared to DG-STA.<\/figcaption><\/figure>\n\n\n\n<p class=\"text-justify\">Using the 3D skeleton generated by DSF can greatly improve the accuracy of the skeleton-based action recognition, which shows that our method has strong application potential in downstream tasks.<\/p>\n\n\n\n<h2 class=\"wp-block-heading\">Conclusion<\/h2>\n\n\n\n<p class=\"text-justify\">In this paper, we propose a Dual-branch Self-boosting Framework (DSF) to achieve accurate, robust and flexible 3D hand pose and model estimation without using any labeled real data.<\/p>\n\n\n\n<p class=\"text-justify\">1\ufe0f\u20e3 Firstly, we propose an <strong>image-to-image translation technology<\/strong> to reduce the domain gap between synthetic data and real data, which significantly improves the effect of network pre-training.<\/p>\n\n\n\n<p class=\"text-justify\">2\ufe0f\u20e3 Secondly, we propose a dual-branch self-boosting network that can maintain the accuracy of 3D pose estimation and the robustness and flexibility of 3D hand model estimation simultaneously.<\/p>\n\n\n\n<p class=\"text-justify\">3\ufe0f\u20e3 Through an <strong>inter-branch loss<\/strong> and a <strong>part-aware model-fitting loss<\/strong>, we fully explore the advantages of the dual-branch structure. 
The two branches can promote each other continuously during the self-supervised training on unlabeled real data.<\/p>\n\n\n\n<p class=\"text-justify\">\u2705 Our method achieves comparable results to state-of-the-art fully supervised methods and shows better generalization performance.<\/p>\n\n\n\n<p class=\"text-justify\">\u2705 Our method outperforms previous self-supervised methods without using paired multi-view images.<\/p>\n\n\n\n<p class=\"text-justify\">\u2705 In addition, our method greatly improves the accuracy of skeleton-based gesture recognition, which shows that our method has strong application potential in downstream tasks.<\/p>\n\n\n\n<div class=\"wp-block-group is-layout-flow wp-block-group-is-layout-flow\">\n<h2 class=\"wp-block-heading\">Supplementary Videos<\/h2>\n\n\n\n<details class=\"wp-block-details is-layout-flow wp-block-details-is-layout-flow\"><summary>This video shows the performance of our method on the test set of the NYU dataset.<\/summary>\n<div style=\"text-align: center;\">\n    <iframe loading=\"lazy\" src=\"\/\/player.bilibili.com\/player.html?isOutside=true&#038;aid=114012691963487&#038;bvid=BV1kUAGezEfd&#038;cid=28420541262&#038;p=1&#038;autoplay=0\" \n            width=\"800\" height=\"450\" \n            scrolling=\"no\" \n            border=\"0\" frameborder=\"no\" \n            framespacing=\"0\" allowfullscreen=\"true\"><\/iframe>\n<\/div>\n<\/details>\n\n\n\n<details class=\"wp-block-details text-justify is-layout-flow wp-block-details-is-layout-flow\"><summary>This video shows the performance of our method on the test set of the ICVL dataset, qualitatively demonstrating that our method can generate more reasonable hand poses than annotations. 
We use red circles to locate errors in annotations.<\/summary>\n<div style=\"text-align: center;\">\n    <iframe loading=\"lazy\" src=\"\/\/player.bilibili.com\/player.html?isOutside=true&#038;aid=114012708674484&#038;bvid=BV1WmAGegEiH&#038;cid=28420670377&#038;p=1&#038;autoplay=0\" \n            width=\"800\" height=\"450\" \n            scrolling=\"no\" \n            border=\"0\" frameborder=\"no\" \n            framespacing=\"0\" allowfullscreen=\"true\"><\/iframe>\n<\/div>\n<\/details>\n\n\n\n<details class=\"wp-block-details text-justify is-layout-flow wp-block-details-is-layout-flow\"><summary>This video shows the performance of our method on the MSRA dataset (subject 0), qualitatively demonstrating that our method can generate more reasonable hand poses than annotations. We use red circles to locate errors in annotations.<\/summary>\n<div style=\"text-align: center;\">\n    <iframe loading=\"lazy\" src=\"\/\/player.bilibili.com\/player.html?isOutside=true&#038;aid=114012725451821&#038;bvid=BV1LPAVebEGv&#038;cid=28420671856&#038;p=1&#038;autoplay=0\" \n            width=\"800\" height=\"450\" \n            scrolling=\"no\" \n            border=\"0\" frameborder=\"no\" \n            framespacing=\"0\" allowfullscreen=\"true\"><\/iframe>\n<\/div>\n<\/details>\n<\/div>\n\n\n\n<h2 class=\"wp-block-heading\">Bibtex<\/h2>\n\n\n\n<pre class=\"wp-block-code\"><code>@ARTICLE{9841448,\n  author={Ren, Pengfei and Sun, Haifeng and Hao, Jiachang and Qi, Qi and Wang, Jingyu and Liao, Jianxin},\n  journal={IEEE Transactions on Image Processing}, \n  title={A Dual-Branch Self-Boosting Framework for Self-Supervised 3D Hand Pose Estimation}, \n  year={2022},\n  volume={31},\n  number={},\n  pages={5052-5066},\n  doi={10.1109\/TIP.2022.3192708}}<\/code><\/pre>\n\n\n\n<p class=\"has-medium-font-size\"><\/p>\n<\/div>\n\n\n\n<p><\/p>","protected":false},"excerpt":{"rendered":"<p>Paper Code For ICVL and MSRA, we show that DSF is able to generate more reasonable hand poses than 
annotations. We use red circles to locate errors in annotations. Overview Through image-to-image translation technology, our framework can make better use of synthetic data for pre-training. The dual-branch design allows our framework to adopt a part-aware [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":794,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_acf_changed":false,"footnotes":"","_links_to":"","_links_to_target":""},"categories":[18],"tags":[],"class_list":["post-793","post","type-post","status-publish","format-standard","has-post-thumbnail","hentry","category-self-supervised-3d-hand-reconstruction"],"acf":{"writer":{"simple_value_formatted":"<code><em>This data type is not supported! Please contact the author for help.<\/em><\/code>","value_formatted":[{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/pengfeiren96.github.io\/\" target=\"_blank\" rel=\"noreferrer noopener\">Pengfei Ren<\/a>","value_formatted":{"title":"Pengfei Ren","url":"https:\/\/pengfeiren96.github.io\/","target":"_blank"},"value":{"title":"Pengfei Ren","url":"https:\/\/pengfeiren96.github.io\/","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}},{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/scholar.google.com\/citations?user=dwhbTsEAAAAJ&hl=en\" target=\"_blank\" rel=\"noreferrer noopener\">Haifeng Sun<\/a>","value_formatted":{"title":"Haifeng Sun","url":"https:\/\/scholar.google.com\/citations?user=dwhbTsEAAAAJ&hl=en","target":"_blank"},"value":{"title":"Haifeng 
Sun","url":"https:\/\/scholar.google.com\/citations?user=dwhbTsEAAAAJ&hl=en","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}},{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/orcid.org\/0000-0001-6842-4721\" target=\"_blank\" rel=\"noreferrer noopener\">Jiachang Hao<\/a>","value_formatted":{"title":"Jiachang Hao","url":"https:\/\/orcid.org\/0000-0001-6842-4721","target":"_blank"},"value":{"title":"Jiachang Hao","url":"https:\/\/orcid.org\/0000-0001-6842-4721","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}},{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/scholar.google.com\/citations?user=2W2h0SwAAAAJ\" target=\"_blank\" rel=\"noreferrer noopener\">Qi Qi<\/a>","value_formatted":{"title":"Qi Qi","url":"https:\/\/scholar.google.com\/citations?user=2W2h0SwAAAAJ","target":"_blank"},"value":{"title":"Qi 
Qi","url":"https:\/\/scholar.google.com\/citations?user=2W2h0SwAAAAJ","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}},{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/scholar.google.com\/citations?user=H441DjwAAAAJ\" target=\"_blank\" rel=\"noreferrer noopener\">Jingyu Wang<\/a>","value_formatted":{"title":"Jingyu Wang","url":"https:\/\/scholar.google.com\/citations?user=H441DjwAAAAJ","target":"_blank"},"value":{"title":"Jingyu Wang","url":"https:\/\/scholar.google.com\/citations?user=H441DjwAAAAJ","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}},{"writer_link":{"simple_value_formatted":"<a href=\"https:\/\/dblp.org\/pid\/60\/4951.html\" target=\"_blank\" rel=\"noreferrer noopener\">Jianxin Liao<\/a>","value_formatted":{"title":"Jianxin Liao","url":"https:\/\/dblp.org\/pid\/60\/4951.html","target":"_blank"},"value":{"title":"Jianxin 
Liao","url":"https:\/\/dblp.org\/pid\/60\/4951.html","target":"_blank"},"field":{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}}}],"value":[{"field_687f0c15f3394":{"title":"Pengfei Ren","url":"https:\/\/pengfeiren96.github.io\/","target":"_blank"}},{"field_687f0c15f3394":{"title":"Haifeng Sun","url":"https:\/\/scholar.google.com\/citations?user=dwhbTsEAAAAJ&hl=en","target":"_blank"}},{"field_687f0c15f3394":{"title":"Jiachang Hao","url":"https:\/\/orcid.org\/0000-0001-6842-4721","target":"_blank"}},{"field_687f0c15f3394":{"title":"Qi Qi","url":"https:\/\/scholar.google.com\/citations?user=2W2h0SwAAAAJ","target":"_blank"}},{"field_687f0c15f3394":{"title":"Jingyu Wang","url":"https:\/\/scholar.google.com\/citations?user=H441DjwAAAAJ","target":"_blank"}},{"field_687f0c15f3394":{"title":"Jianxin Liao","url":"https:\/\/dblp.org\/pid\/60\/4951.html","target":"_blank"}}],"field":{"ID":2366,"key":"field_687f08dfb7e07","label":"\u4f5c\u8005","name":"writer","aria-label":"","prefix":"acf","type":"repeater","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"acfe_repeater_stylised_button":0,"layout":"row","pagination":0,"min":0,"max":0,"collapsed":"","button_label":"Add 
Row","rows_per_page":20,"_name":"writer","_valid":1,"sub_fields":[{"ID":2368,"key":"field_687f0c15f3394","label":"\u4f5c\u8005\u4e0e\u4f5c\u8005\u4e3b\u9875","name":"writer_link","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":0,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":2366,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"writer_link","_valid":1,"parent_repeater":"field_687f08dfb7e07"}]}},"\u4f1a\u8bae\u540d\u79f0":{"simple_value_formatted":"TIP","value_formatted":"TIP","value":"TIP","field":{"ID":53,"key":"field_6759c5b33fdb3","label":"\u4f1a\u8bae\u540d\u79f0","name":"\u4f1a\u8bae\u540d\u79f0","aria-label":"","prefix":"acf","type":"text","value":null,"menu_order":1,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"default_value":"\u586b\u5199\u4f1a\u8bae","maxlength":"","allow_in_bindings":1,"placeholder":"","prepend":"","append":"","_name":"\u4f1a\u8bae\u540d\u79f0","_valid":1}},"\u5e74":{"simple_value_formatted":"2022","value_formatted":"2022","value":"2022","field":{"ID":254,"key":"field_675b036a7706e","label":"\u5e74","name":"\u5e74","aria-label":"","prefix":"acf","type":"text","value":null,"menu_order":2,"instructions":"","required":1,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"default_value":2024,"maxlength":"","allow_in_bindings":1,"placeholder":"","prepend":"","append":"","_name":"\u5e74","_valid":1}},"code":{"simple_value_formatted":"<a href=\"https:\/\/github.com\/PengfeiRen96\/DSF\" target=\"_blank\" rel=\"noreferrer 
noopener\">Code<\/a>","value_formatted":{"title":"Code","url":"https:\/\/github.com\/PengfeiRen96\/DSF","target":"_blank"},"value":{"title":"Code","url":"https:\/\/github.com\/PengfeiRen96\/DSF","target":"_blank"},"field":{"ID":54,"key":"field_6759c5dc3fdb4","label":"code","name":"code","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":3,"instructions":"","required":0,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":1,"_name":"code","_valid":1}},"arxiv":{"simple_value_formatted":"","value_formatted":"","value":"","field":{"ID":55,"key":"field_6759c5f83fdb5","label":"arXiv","name":"arxiv","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":4,"instructions":"","required":0,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":0,"_name":"arxiv","_valid":1}},"pdf":{"simple_value_formatted":"<a href=\"https:\/\/ieeexplore.ieee.org\/abstract\/document\/9841448\/\" target=\"_blank\" rel=\"noreferrer noopener\">PDF<\/a>","value_formatted":{"title":"PDF","url":"https:\/\/ieeexplore.ieee.org\/abstract\/document\/9841448\/","target":"_blank"},"value":{"title":"PDF","url":"https:\/\/ieeexplore.ieee.org\/abstract\/document\/9841448\/","target":"_blank"},"field":{"ID":56,"key":"field_6759c6b83fdb6","label":"pdf","name":"pdf","aria-label":"","prefix":"acf","type":"link","value":null,"menu_order":5,"instructions":"","required":0,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"return_format":"array","allow_in_bindings":0,"_name":"pdf","_valid":1}},"rank":{"simple_value_formatted":"\u4e2d\u79d1\u9662\u4e00\u533a, IF=11.041, CCF-A\u7c7b, \u8ba1\u7b97\u673a\u89c6\u89c9\u9886\u57df\u9876\u520a","value_formatted":"\u4e2d\u79d1\u9662\u4e00\u533a, IF=11.041, CCF-A\u7c7b, 
\u8ba1\u7b97\u673a\u89c6\u89c9\u9886\u57df\u9876\u520a","value":"\u4e2d\u79d1\u9662\u4e00\u533a, IF=11.041, CCF-A\u7c7b, \u8ba1\u7b97\u673a\u89c6\u89c9\u9886\u57df\u9876\u520a","field":{"ID":2316,"key":"field_686b28a2069eb","label":"\u4f1a\u8bae\/\u671f\u520a\u7ea7\u522b","name":"rank","aria-label":"","prefix":"acf","type":"text","value":null,"menu_order":6,"instructions":"","required":0,"id":"","class":"","conditional_logic":0,"parent":52,"wrapper":{"width":"","class":"","id":""},"default_value":"CCF-A","maxlength":"","allow_in_bindings":0,"placeholder":"","prepend":"","append":"","_name":"rank","_valid":1}}},"_links":{"self":[{"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/posts\/793","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/comments?post=793"}],"version-history":[{"count":68,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/posts\/793\/revisions"}],"predecessor-version":[{"id":2545,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/posts\/793\/revisions\/2545"}],"wp:featuredmedia":[{"embeddable":true,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/media\/794"}],"wp:attachment":[{"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/media?parent=793"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/categories?post=793"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/cv.nirc.top\/zh\/wp-json\/wp\/v2\/tags?post=793"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}