{"id":123,"date":"2025-08-15T16:41:30","date_gmt":"2025-08-15T08:41:30","guid":{"rendered":"https:\/\/alyname.top\/index.php\/2025\/08\/15\/high-resolution-image-synthesis-with-latent-diffusion-models\/"},"modified":"2025-08-15T16:44:09","modified_gmt":"2025-08-15T08:44:09","slug":"high-resolution-image-synthesis-with-latent-diffusion-models","status":"publish","type":"post","link":"https:\/\/alyname.top\/index.php\/2025\/08\/15\/high-resolution-image-synthesis-with-latent-diffusion-models\/","title":{"rendered":"\u7b14\u8bb0 &#8211; High-Resolution Image Synthesis with Latent Diffusion Models"},"content":{"rendered":"<p>LDM\uff0c\u53c8\u79f0 Stable Diffusion\u3002<\/p>\n<p>LDM \u60f3\u505a\u7684\u4e8b\u60c5\u662f\u5feb\u901f\u751f\u6210\u9ad8\u6e05\u6670\u5ea6\u7684\u56fe\u7247\u3002\u60f3\u6cd5\u662f\u8fd9\u6837\u7684\uff1aDiffusion \u8fc7\u7a0b\u4e0d\u4e00\u5b9a\u8981\u5728\u539f\u59cb\u56fe\u7247\u4e0a\u505a\uff0c\u53ef\u4ee5\u5728\u8fdb Diffusion \u8fc7\u7a0b\u524d\u52a0\u4e00\u4e2a VAE\uff0c\u628a\u4e00\u4e2a\u5927\u56fe\u7247\u8fc7\u4e00\u4e2a Encoder \u53d8\u6210\u4e00\u4e2a\u5c0f\u7684\u3001\u9690\u7a7a\u95f4\u56fe\u7247\u3002<\/p>\n<p>\u8bad\u5b8c\u4e4b\u540e\u751f\u6210\u7684\u65f6\u5019\u4e5f\u662f\u751f\u6210\u9690\u7a7a\u95f4\u56fe\u7247\uff0c\u7136\u540e\u8fc7\u4e00\u4e2a Decoder \u53d8\u6210\u539f\u56fe\u7247\u3002<\/p>\n<p>\u6b64\u5916 LDM \u8fd8\u505a\u4e86\u4e00\u4e2a\u4e8b\u60c5\uff0c\u5728 U-Net \u91cc\u9762\u63d2\u4e86\u4e00\u4e9b Cross Attention \u5c42\uff0c\u7136\u540e\u7528\u4e00\u4e2a Encoder \u7f16\u7801\u5916\u90e8\u7684\u6587\u672c\u7b49\u6761\u4ef6\uff0c\u7f16\u7801\u540e\u7684\u7ed3\u679c\u585e\u5230 <mjx-container class=\"MathJax\" jax=\"SVG\" style=\"direction: ltr; position: relative;\"><svg style=\"overflow: visible; min-height: 1px; min-width: 1px; vertical-align: -0.439ex;\" xmlns=\"http:\/\/www.w3.org\/2000\/svg\" width=\"4.757ex\" height=\"1.984ex\" role=\"img\" focusable=\"false\" viewBox=\"0 -683 2102.7 877\" aria-hidden=\"true\"><g stroke=\"currentColor\" fill=\"currentColor\" stroke-width=\"0\" transform=\"scale(1,-1)\"><g data-mml-node=\"math\"><g data-mml-node=\"mi\"><path data-c=\"1D43E\" d=\"M285 628Q285 635 228 637Q205 637 198 638T191 647Q191 649 193 661Q199 681 203 682Q205 683 214 683H219Q260 681 355 681Q389 681 418 681T463 682T483 682Q500 682 500 674Q500 669 497 660Q496 658 496 654T495 648T493 644T490 641T486 639T479 638T470 637T456 637Q416 636 405 634T387 623L306 305Q307 305 490 449T678 597Q692 611 692 620Q692 635 667 637Q651 637 651 648Q651 650 654 662T659 677Q662 682 676 682Q680 682 711 681T791 680Q814 680 839 681T869 682Q889 682 889 672Q889 650 881 642Q878 637 862 637Q787 632 726 586Q710 576 656 534T556 455L509 418L518 396Q527 374 546 329T581 244Q656 67 661 61Q663 59 666 57Q680 47 717 46H738Q744 38 744 37T741 19Q737 6 731 0H720Q680 3 625 3Q503 3 488 0H478Q472 6 472 9T474 27Q478 40 480 43T491 46H494Q544 46 544 71Q544 75 517 141T485 216L427 354L359 301L291 248L268 155Q245 63 245 58Q245 51 253 49T303 46H334Q340 37 340 35Q340 19 333 5Q328 0 317 0Q314 0 280 1T180 2Q118 2 85 2T49 1Q31 1 31 11Q31 13 34 25Q38 41 42 43T65 46Q92 46 125 49Q139 52 144 61Q147 65 216 339T285 628Z\" style=\"stroke-width: 3;\"\/><\/g><g data-mml-node=\"mo\" transform=\"translate(889,0)\"><path data-c=\"2C\" d=\"M78 35T78 60T94 103T137 121Q165 121 187 96T210 8Q210 -27 201 -60T180 -117T154 -158T130 -185T117 -194Q113 -194 104 -185T95 -172Q95 -168 106 -156T131 -126T157 -76T173 -3V9L172 8Q170 7 167 6T161 3T152 1T140 0Q113 0 96 17Z\" style=\"stroke-width: 3;\"\/><\/g><g data-mml-node=\"mi\" transform=\"translate(1333.7,0)\"><path data-c=\"1D449\" d=\"M52 648Q52 670 65 683H76Q118 680 181 680Q299 680 320 683H330Q336 677 336 674T334 656Q329 641 325 637H304Q282 635 274 635Q245 630 242 620Q242 618 271 369T301 118L374 235Q447 352 520 471T595 594Q599 601 599 609Q599 633 555 637Q537 637 537 648Q537 649 539 661Q542 675 545 679T558 683Q560 683 570 683T604 682T668 681Q737 681 755 683H762Q769 676 769 672Q769 655 760 640Q757 637 743 637Q730 636 719 635T698 630T682 623T670 615T660 608T652 599T645 592L452 282Q272 -9 266 -16Q263 -18 259 -21L241 -22H234Q216 -22 216 -15Q213 -9 177 305Q139 623 138 626Q133 637 76 637H59Q52 642 52 648Z\" style=\"stroke-width: 3;\"\/><\/g><\/g><\/g><\/svg><mjx-assistive-mml unselectable=\"on\" display=\"inline\" style=\"top: 0px; left: 0px; clip: rect(1px, 1px, 1px, 1px); -webkit-touch-callout: none; -webkit-user-select: none; -khtml-user-select: none; -moz-user-select: none; -ms-user-select: none; user-select: none; position: absolute; padding: 1px 0px 0px 0px; border: 0px; display: block; width: auto; overflow: hidden;\"><math xmlns=\"http:\/\/www.w3.org\/1998\/Math\/MathML\"><mi>K<\/mi><mo>,<\/mo><mi>V<\/mi><\/math><\/mjx-assistive-mml><\/mjx-container> \u91cc\u3002\u8fd9\u6837\u53ef\u4ee5\u5f15\u5165\u5916\u90e8\u63a7\u5236\u3002<s>\u611f\u89c9\u8fd9\u624d\u662f Stable Diffusion \u771f\u6b63\u706b\u8d77\u6765\u7684\u539f\u56e0<\/s><\/p>\n<p><a href=\"https:\/\/arxiv.org\/abs\/2112.10752\">[2112.10752] High-Resolution Image Synthesis with Latent Diffusion Models<\/a><\/p>\n<hr>\n<h5>Latent Space<\/h5>\n<p><img decoding=\"async\" src=\"https:\/\/alyname.top\/wp-content\/uploads\/2025\/08\/Pasted-image-20250809202354.png\" alt=\"Pasted image 20250809202354.png\"><br \/>\nTODO<\/p>\n<div class=\"clearfix\"><\/div>","protected":false},"excerpt":{"rendered":"<p>LDM\uff0c\u53c8\u79f0 Stable Diffusion\u3002 LDM \u60f3\u505a\u7684\u4e8b\u60c5\u662f\u5feb\u901f\u751f\u6210\u9ad8\u6e05\u6670\u5ea6\u7684\u56fe\u7247\u3002\u60f3\u6cd5\u662f\u8fd9\u6837\u7684\uff1aD [&hellip;]<\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[5],"tags":[],"class_list":["post-123","post","type-post","status-publish","format-standard","hentry","category-research"],"_links":{"self":[{"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/posts\/123","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/comments?post=123"}],"version-history":[{"count":1,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/posts\/123\/revisions"}],"predecessor-version":[{"id":132,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/posts\/123\/revisions\/132"}],"wp:attachment":[{"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/media?parent=123"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/categories?post=123"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/alyname.top\/index.php\/wp-json\/wp\/v2\/tags?post=123"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}