Spaces:
Runtime error
Runtime error
File size: 11,815 Bytes
c79133e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 |
<!DOCTYPE html>
<html>
<head>
  <meta charset="utf-8">

  <!-- Social-media preview metadata. This is the page's "business card" when it is shared, so keep it accurate. -->
  <meta name="description" content="Any2AnyTryon: Leveraging Adaptive Position Embeddings for Versatile Virtual Clothing Tasks">
  <meta property="og:title" content="Any2AnyTryon">
  <meta property="og:description" content="A versatile framework for virtual clothing tasks including garment reconstruction, model-free virtual try-on and virtual try-on">
  <meta property="og:url" content="https://logn-2024.github.io/Any2anyTryon/">
  <!-- Open Graph banner image (declared below as 1200x630). Uses the same asset/images/ directory as
       twitter:image and the favicon; the previous "asset/image/" directory matched no other asset path.
       NOTE(review): many link-preview crawlers expect an absolute URL here; confirm against the deployed site. -->
  <meta property="og:image" content="asset/images/teaser.png">
  <meta property="og:image:width" content="1200">
  <meta property="og:image:height" content="630">

  <meta name="twitter:title" content="Any2AnyTryon">
  <meta name="twitter:description" content="A versatile framework for virtual clothing tasks">
  <!-- Twitter banner image; the recommended size for this card type is 1200x600. -->
  <meta name="twitter:image" content="asset/images/teaser.png">
  <meta name="twitter:card" content="summary_large_image">

  <!-- Keywords under which the paper should be indexed. -->
  <meta name="keywords" content="virtual try-on, garment reconstruction, diffusion models">
  <meta name="viewport" content="width=device-width, initial-scale=1">

  <title>Any2AnyTryon</title>
  <link rel="icon" type="image/x-icon" href="asset/images/favicon.ico">

  <!-- Stylesheets: web fonts, Bulma and its carousel/slider add-ons, icon fonts, then the page's own rules last. -->
  <link href="https://fonts.googleapis.com/css?family=Google+Sans|Noto+Sans|Castoro"
        rel="stylesheet">
  <link rel="stylesheet" href="asset/css/bulma.min.css">
  <link rel="stylesheet" href="asset/css/bulma-carousel.min.css">
  <link rel="stylesheet" href="asset/css/bulma-slider.min.css">
  <link rel="stylesheet" href="asset/css/fontawesome.all.min.css">
  <link rel="stylesheet"
        href="https://cdn.jsdelivr.net/gh/jpswalsh/academicons@1/css/academicons.min.css">
  <link rel="stylesheet" href="asset/css/index.css">

  <!-- Scripts run in document order; only the Font Awesome script is deferred.
       index.js is listed after jQuery and the Bulma add-ons, so keep this order when editing. -->
  <script src="https://ajax.googleapis.com/ajax/libs/jquery/3.5.1/jquery.min.js"></script>
  <script src="https://documentcloud.adobe.com/view-sdk/main.js"></script>
  <script defer src="asset/js/fontawesome.all.min.js"></script>
  <script src="asset/js/bulma-carousel.min.js"></script>
  <script src="asset/js/bulma-slider.min.js"></script>
  <script src="asset/js/index.js"></script>
</head>
<body>
<!-- Title banner: paper title, author list, affiliations and resource buttons -->
<section class="hero">
  <div class="hero-body">
    <div class="container is-max-desktop">
      <div class="columns is-centered">
        <div class="column has-text-centered">
          <h1 class="title is-1 publication-title">Any2AnyTryon: Leveraging Adaptive Position Embeddings for Versatile Virtual Clothing Tasks</h1>

          <!-- Paper authors. Superscripts refer to the numbered affiliations in the next block.
               Authors without a known homepage use an href-less anchor (an inert placeholder)
               so that clicking the name does not open a duplicate of this page in a new tab. -->
          <div class="is-size-5 publication-authors">
            <span class="author-block">
              <a href="https://github.com/logn-2024" target="_blank" rel="noopener">Hailong Guo</a><sup>1</sup>,</span>
            <span class="author-block">
              <a>Bohan Zeng</a><sup>2</sup>,</span>
            <span class="author-block">
              <a>Yiren Song</a><sup>3</sup>,</span>
            <span class="author-block">
              <a>Wentao Zhang</a><sup>2</sup>,</span>
            <span class="author-block">
              <a>Chuang Zhang</a><sup>1</sup>,</span>
            <span class="author-block">
              <a>Jiaming Liu</a><sup>4</sup>
            </span>
          </div>

          <!-- Affiliations, numbered to match the author superscripts -->
          <div class="is-size-5 publication-authors">
            <span class="author-block"><br><sup>1</sup>Beijing University of Posts and Telecommunications</span>
            <span class="author-block"><br><sup>2</sup>Peking University</span><br>
            <span class="author-block"><br><sup>3</sup>National University of Singapore</span>
            <span class="author-block"><br><sup>4</sup>TiamatAI</span>
          </div>

          <!-- Resource buttons. Each opens in a new tab; rel="noopener" keeps the opened page
               from getting a window.opener handle back to this one. Icons are decorative
               because the visible text label already names the destination. -->

          <!-- GitHub link -->
          <span class="link-block">
            <a href="https://github.com/logn-2024/Any2anyTryon" target="_blank" rel="noopener"
               class="external-link button is-normal is-rounded is-dark">
              <span class="icon">
                <i class="fab fa-github" aria-hidden="true"></i>
              </span>
              <span>Code</span>
            </a>
          </span>

          <!-- arXiv abstract link -->
          <span class="link-block">
            <a href="https://arxiv.org/abs/2501.15891" target="_blank" rel="noopener"
               class="external-link button is-normal is-rounded is-dark">
              <span class="icon">
                <i class="ai ai-arxiv" aria-hidden="true"></i>
              </span>
              <span>arXiv</span>
            </a>
          </span>

          <!-- Demo link -->
          <span class="link-block">
            <a href="https://huggingface.co/spaces/jamesliu1217/Any2anyTryon_exp" target="_blank" rel="noopener"
               class="external-link button is-normal is-rounded is-dark">
              <span class="icon">
                <i class="fas fa-gamepad" aria-hidden="true"></i>
              </span>
              <span>Demo</span>
            </a>
          </span>

          <!-- Models link -->
          <span class="link-block">
            <a href="https://huggingface.co/loooooong/Any2anyTryon" target="_blank" rel="noopener"
               class="external-link button is-normal is-rounded is-dark">
              <span class="icon">
                <i class="fas fa-cube" aria-hidden="true"></i>
              </span>
              <span>Models</span>
            </a>
          </span>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- Abstract: light-background section holding the paper summary as a single justified paragraph -->
<section class="section hero is-light">
  <div class="container is-max-desktop">
    <div class="columns is-centered has-text-centered">
      <div class="column is-four-fifths">
        <h2 class="title is-3">Abstract</h2>
        <div class="content has-text-justified">
          <p>
            Image-based virtual try-on (VTON) aims to generate a virtual try-on result by transferring an input garment onto a target person's image. However, the scarcity of paired garment-model data makes it challenging for existing methods to achieve high generalization and quality in VTON. Also, it limits the ability to generate mask-free try-ons. To tackle the data scarcity problem, approaches such as Stable Garment and MMTryon use a synthetic data strategy, effectively increasing the amount of paired data on the model side. However, existing methods are typically limited to performing specific try-on tasks and lack user-friendliness.
            To enhance the generalization and controllability of VTON generation, we propose Any2AnyTryon, which can generate try-on results based on different textual instructions and model garment images to meet various needs, eliminating the reliance on masks, poses, or other conditions. Specifically, we first construct the virtual try-on dataset LAION-Garment, the largest known open-source garment try-on dataset. Then, we introduce adaptive position embedding, which enables the model to generate satisfactory outfitted model images or garment images based on input images of different sizes and categories, significantly enhancing the generalization and controllability of VTON generation. In our experiments, we demonstrate the effectiveness of our Any2AnyTryon and compare it with existing methods. The results show that Any2AnyTryon enables flexible, controllable, and high-quality image-based virtual try-on generation.
          </p>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- End of abstract -->
<!-- Image carousel (not displayed): a copy of the garment-reconstruction carousel that is kept in the
     DOM but hidden by the inline display rule on the section. -->
<section class="hero is-small" style="display: none;">
  <div class="hero-body">
    <div class="container">
      <h3 class="title is-4">Garment Reconstruction</h3>
      <!-- The id is distinct from the visible carousel's "results-garment": ids must be unique
           within a document, and lookups by id only ever resolve to one element. -->
      <div id="results-garment-hidden" class="carousel results-carousel">
        <div class="item">
          <img src="asset/images/supp_tryoff_wild.png" alt="Garment Reconstruction Results">
          <h2 class="subtitle has-text-centered">
            Garment reconstruction results in the wild.
          </h2>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- End image carousel -->
<!-- Results carousel: garment reconstruction -->
<section class="hero is-small">
  <div class="hero-body">
    <div class="container">
      <h3 class="title is-4">Garment Reconstruction</h3>
      <div id="results-garment" class="carousel results-carousel">
        <!-- Single slide: result figure with its caption underneath -->
        <div class="item">
          <img src="asset/images/supp_tryoff_wild.png" alt="Garment Reconstruction Results">
          <h2 class="subtitle has-text-centered">
            Garment reconstruction results in the wild.
          </h2>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- End of garment reconstruction carousel -->
<!-- Results carousel: model-free virtual try-on -->
<section class="hero is-small">
  <div class="hero-body">
    <div class="container">
      <h3 class="title is-4">Model-free Virtual Try-on</h3>
      <div id="results-model" class="carousel results-carousel">
        <!-- Single slide: result figure with its caption underneath -->
        <div class="item">
          <img src="asset/images/model_generation_supp.png" alt="Model-free VTON Results">
          <h2 class="subtitle has-text-centered">
            Model-free virtual tryon results
          </h2>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- End of model-free try-on carousel -->
<!-- Results carousel: virtual try-on -->
<section class="hero is-small">
  <div class="hero-body">
    <div class="container">
      <h3 class="title is-4">Virtual Try-on</h3>
      <div id="results-vton" class="carousel results-carousel">
        <!-- Single slide: comparison figure with its caption underneath -->
        <div class="item">
          <img src="asset/images/tryon_compare.png" alt="VTON Results">
          <h2 class="subtitle has-text-centered">
            Virtual tryon results in the shop
          </h2>
        </div>
      </div>
    </div>
  </div>
</section>
<!-- End of virtual try-on carousel -->
<!-- BibTeX citation. The entry sits inside <pre>, so its line breaks and leading whitespace are
     rendered literally; keep the entry text flush-left exactly as written. -->
<section class="section" id="BibTeX">
  <div class="container is-max-desktop content">
    <h2 class="title">BibTeX</h2>
    <pre><code>@misc{guo2025any2anytryonleveragingadaptiveposition,
title={Any2AnyTryon: Leveraging Adaptive Position Embeddings for Versatile Virtual Clothing Tasks},
author={Hailong Guo and Bohan Zeng and Yiren Song and Wentao Zhang and Chuang Zhang and Jiaming Liu},
year={2025},
eprint={2501.15891},
archivePrefix={arXiv},
primaryClass={cs.CV},
url={https://arxiv.org/abs/2501.15891},
}</code></pre>
  </div>
</section>
<!-- End of BibTeX citation -->
<!-- Page footer: credit for the website template -->
<footer class="footer">
  <div class="container">
    <div class="columns is-centered">
      <div class="column is-8">
        <div class="content">
          <p>
            Website template from <a href="https://github.com/eliahuhorwitz/Academic-project-page-template">Academic Project Page Template</a>
          </p>
        </div>
      </div>
    </div>
  </div>
</footer>
<!-- Statcounter tracking code placeholder: no tracker is installed. -->
<!-- To track page visits, create an account at statcounter.com and paste its snippet here. -->
<!-- End of Statcounter placeholder -->
</body>
</html>