requirements_sorted.json 175 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
7277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191
  1. {
  2. "requirements": [
  3. {
  4. "requirement_id": "REQ_055",
  5. "requirement_text": "生成人物局部特写画面,如放大呈现嘴巴咬食物、手持物品、耳朵佩戴饰品、鼻子、指甲等身体局部细节,画面填充感强,细节清晰可见",
  6. "source_subtree": {
  7. "parent_node": "景别角度",
  8. "parent_id": 15366,
  9. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度"
  10. },
  11. "source_nodes": [
  12. "特写近景",
  13. "景别角度"
  14. ],
  15. "source_posts": [
  16. "6649dbe3000000000c018112",
  17. "664c38f0000000001303c21f",
  18. "6687d458000000000a026f91",
  19. "66daeddb000000002603ea42",
  20. "672ed3b6000000003c017f82",
  21. "67862d98000000001a01f443",
  22. "67bee0df000000002802acd1",
  23. "67d55ec7000000000e004e69",
  24. "67e6398f000000001d005ebb",
  25. "682ede8f000000002202bff2",
  26. "683d8695000000001200012a",
  27. "6911532d000000000503bd18",
  28. "692c3402000000000d03b7b7",
  29. "692d3b99000000001e022295",
  30. "69535514000000001e032b26",
  31. "6964d4bf000000001a031a54",
  32. "69672e2d000000001a026263",
  33. "697638e8000000001a025711",
  34. "697a20e9000000001a033338",
  35. "697b64c5000000001a021517"
  36. ],
  37. "matched_capabilities": [
  38. "CAP-001",
  39. "CAP-016"
  40. ],
  41. "capability_combination": "CAP-001 通过提示词描述指定身体局部部位(如'extreme close-up of fingers holding a ring, filling the frame')控制景别和构图,生成局部特写画面;CAP-016 配合高分辨率输出确保局部细节(纹理、质感)清晰可见,满足画面填充感强且细节突出的要求。",
  42. "match_status": "完全满足",
  43. "needs_research": false,
  44. "research_note": ""
  45. },
  46. {
  47. "requirement_id": "REQ_056",
  48. "requirement_text": "生成人物近景半身或胸部以上的画面,突出人物面部表情和情绪,背景适当虚化,让观看者能清楚看到人物的神态与互动感",
  49. "source_subtree": {
  50. "parent_node": "景别角度",
  51. "parent_id": 15366,
  52. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度"
  53. },
  54. "source_nodes": [
  55. "特写近景",
  56. "景别角度"
  57. ],
  58. "source_posts": [
  59. "6649dbe3000000000c018112",
  60. "664c38f0000000001303c21f",
  61. "6687d458000000000a026f91",
  62. "66daeddb000000002603ea42",
  63. "672ed3b6000000003c017f82",
  64. "67862d98000000001a01f443",
  65. "67bee0df000000002802acd1",
  66. "67d55ec7000000000e004e69",
  67. "67e6398f000000001d005ebb",
  68. "682ede8f000000002202bff2",
  69. "683d8695000000001200012a",
  70. "6911532d000000000503bd18",
  71. "692c3402000000000d03b7b7",
  72. "692d3b99000000001e022295",
  73. "69535514000000001e032b26",
  74. "6964d4bf000000001a031a54",
  75. "69672e2d000000001a026263",
  76. "697638e8000000001a025711",
  77. "697a20e9000000001a033338",
  78. "697b64c5000000001a021517"
  79. ],
  80. "matched_capabilities": [
  81. "CAP-001",
  82. "CAP-005"
  83. ],
  84. "capability_combination": "CAP-001 通过提示词描述近景半身构图(如'half-body portrait, chest up, shallow depth of field, blurred background, expressive facial emotion')控制景别、背景虚化和情绪氛围;CAP-005 对生成图像中的人脸区域进行增强修复,确保面部表情细节清晰自然、五官比例准确,强化神态与互动感的呈现。",
  85. "match_status": "完全满足",
  86. "needs_research": false,
  87. "research_note": ""
  88. },
  89. {
  90. "requirement_id": "REQ_057",
  91. "requirement_text": "生成产品或物品的极近距离特写图,如食物截面、商品细节、小物件放大展示,画面主体占满画幅,质感和纹理清晰突出",
  92. "source_subtree": {
  93. "parent_node": "景别角度",
  94. "parent_id": 15366,
  95. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度"
  96. },
  97. "source_nodes": [
  98. "特写近景",
  99. "景别角度"
  100. ],
  101. "source_posts": [
  102. "6649dbe3000000000c018112",
  103. "664c38f0000000001303c21f",
  104. "6687d458000000000a026f91",
  105. "66daeddb000000002603ea42",
  106. "672ed3b6000000003c017f82",
  107. "67862d98000000001a01f443",
  108. "67bee0df000000002802acd1",
  109. "67d55ec7000000000e004e69",
  110. "67e6398f000000001d005ebb",
  111. "682ede8f000000002202bff2",
  112. "683d8695000000001200012a",
  113. "6911532d000000000503bd18",
  114. "692c3402000000000d03b7b7",
  115. "692d3b99000000001e022295",
  116. "69535514000000001e032b26",
  117. "6964d4bf000000001a031a54",
  118. "69672e2d000000001a026263",
  119. "697638e8000000001a025711",
  120. "697a20e9000000001a033338",
  121. "697b64c5000000001a021517"
  122. ],
  123. "matched_capabilities": [
  124. "CAP-001",
  125. "CAP-016",
  126. "CAP-006"
  127. ],
  128. "capability_combination": "CAP-001 通过提示词描述极近距离微距构图(如'macro close-up of food cross-section, filling the entire frame, sharp texture detail')控制景别和主体占满画幅;CAP-016 在生成阶段直接输出高分辨率图像,确保质感和纹理在原生尺寸下清晰完整;CAP-006 作为补充后处理手段,对已生成图像进行细节增强和放大,进一步突出纹理质感。",
  129. "match_status": "完全满足",
  130. "needs_research": false,
  131. "research_note": ""
  132. },
  133. {
  134. "requirement_id": "REQ_091",
  135. "requirement_text": "生成拟人化动物角色表情包:用AI生成具有丰富表情和情绪的卡通动物形象(如毛茸茸的红色马、灰色驴),能够呈现出沮丧、无奈、委屈等多种情绪状态,配合不同场景背景(办公室、草地、室内),整体风格介于3D皮克斯动画和水彩插画之间,适合搭配幽默文案使用",
  136. "source_subtree": {
  137. "parent_node": "泛化概括",
  138. "parent_id": 15904,
  139. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/泛化概括"
  140. },
  141. "source_nodes": [
  142. "构成单元",
  143. "表现载体",
  144. "风格基调",
  145. "表达技法"
  146. ],
  147. "source_posts": [
  148. "61bdc28b0000000001024896",
  149. "6634a322000000001e01bcd5",
  150. "673c37610000000007029ced",
  151. "67e224cc000000000602a6c5",
  152. "685b68c300000000150226bd",
  153. "6865ec61000000000b02c53b",
  154. "6880a7a7000000000b02f5a6",
  155. "6892d47c0000000025018c4f",
  156. "689b158f000000001b03e512",
  157. "68b15f32000000001d00ef75",
  158. "68bf8639000000001c03efd2",
  159. "68ca143d000000001202c3de",
  160. "68f5976e000000000700dd28",
  161. "6913cafd000000000703402b",
  162. "692cc7ab000000001b030110",
  163. "692d3b99000000001e022295",
  164. "693f425a000000001e00ed26",
  165. "6960924b000000001a037a1c",
  166. "6964ab0e000000001a035c04"
  167. ],
  168. "matched_capabilities": [
  169. "CAP-001",
  170. "CAP-003",
  171. "CAP-004"
  172. ],
  173. "capability_combination": "CAP-001(文本到图像生成)作为核心能力,通过详细提示词描述角色外观、情绪状态和场景背景生成基础图像;CAP-004(风格切换与风格控制)通过风格参考图或LoRA控制3D皮克斯与水彩插画混合风格;CAP-003(图像主体一致性保持)确保同一角色(红色马、灰色驴)在不同情绪和场景中保持外观一致性,实现系列表情包的角色统一。",
  174. "match_status": "完全满足",
  175. "needs_research": false,
  176. "research_note": ""
  177. },
  178. {
  179. "requirement_id": "REQ_092",
  180. "requirement_text": "制作图文混排的知识科普长图:以深青色/蓝绿色为底色背景,将心理学等知识内容拆分为多个板块,每个板块搭配风格统一的插画小图(奇幻风格人物、动物等),文字与插图穿插排布,整体呈现出版式清晰、视觉层次丰富的杂志风格科普图文效果",
  181. "source_subtree": {
  182. "parent_node": "泛化概括",
  183. "parent_id": 15904,
  184. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/泛化概括"
  185. },
  186. "source_nodes": [
  187. "组织方式",
  188. "表现载体",
  189. "风格基调",
  190. "表达技法"
  191. ],
  192. "source_posts": [
  193. "61bdc28b0000000001024896",
  194. "6634a322000000001e01bcd5",
  195. "673c37610000000007029ced",
  196. "67e224cc000000000602a6c5",
  197. "685b68c300000000150226bd",
  198. "6865ec61000000000b02c53b",
  199. "6880a7a7000000000b02f5a6",
  200. "6892d47c0000000025018c4f",
  201. "689b158f000000001b03e512",
  202. "68b15f32000000001d00ef75",
  203. "68bf8639000000001c03efd2",
  204. "68ca143d000000001202c3de",
  205. "68f5976e000000000700dd28",
  206. "6913cafd000000000703402b",
  207. "692cc7ab000000001b030110",
  208. "692d3b99000000001e022295",
  209. "693f425a000000001e00ed26",
  210. "6960924b000000001a037a1c",
  211. "6964ab0e000000001a035c04"
  212. ],
  213. "matched_capabilities": [
  214. "CAP-001",
  215. "CAP-004",
  216. "CAP-014"
  217. ],
  218. "capability_combination": "CAP-001 生成各板块所需的奇幻风格插画小图;CAP-004 控制所有插画保持统一的奇幻视觉风格;CAP-014 在图像中渲染文字内容。",
  219. "match_status": "需要调研",
  220. "needs_research": true,
  221. "research_note": "现有能力可以生成单张插画(CAP-001)、控制风格统一(CAP-004)、渲染图内文字(CAP-014),但核心缺口在于:1)多板块图文混排的版式编排能力——将多张插画与多段文字按杂志排版逻辑组织为一张完整长图,现有原子能力表中没有专项的版式/排版合成能力;2)长图画布的整体构图控制——如何将深青色底色、多个文字板块、多张插图统一排布在一张长图中,超出了单纯文生图的能力范围。需要调研:是否有支持多元素版式合成的AI工具(如支持模板化排版的图像生成工具),或是否需要结合设计工具(如Canva、Figma)进行后期排版合成。"
  222. },
  223. {
  224. "requirement_id": "REQ_093",
  225. "requirement_text": "生成室内空间效果图:用AI渲染出具有温暖奶油色调的室内场景,包含拱形门洞、藤编家具、自然光影等元素,整体呈现出地中海或法式复古风格的高质感室内设计效果,光线柔和、色调统一,适合作为家居内容的视觉展示",
  226. "source_subtree": {
  227. "parent_node": "泛化概括",
  228. "parent_id": 15904,
  229. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/泛化概括"
  230. },
  231. "source_nodes": [
  232. "构成单元",
  233. "风格基调",
  234. "表现载体"
  235. ],
  236. "source_posts": [
  237. "61bdc28b0000000001024896",
  238. "6634a322000000001e01bcd5",
  239. "673c37610000000007029ced",
  240. "67e224cc000000000602a6c5",
  241. "685b68c300000000150226bd",
  242. "6865ec61000000000b02c53b",
  243. "6880a7a7000000000b02f5a6",
  244. "6892d47c0000000025018c4f",
  245. "689b158f000000001b03e512",
  246. "68b15f32000000001d00ef75",
  247. "68bf8639000000001c03efd2",
  248. "68ca143d000000001202c3de",
  249. "68f5976e000000000700dd28",
  250. "6913cafd000000000703402b",
  251. "692cc7ab000000001b030110",
  252. "692d3b99000000001e022295",
  253. "693f425a000000001e00ed26",
  254. "6960924b000000001a037a1c",
  255. "6964ab0e000000001a035c04"
  256. ],
  257. "matched_capabilities": [
  258. "CAP-001",
  259. "CAP-004",
  260. "CAP-016"
  261. ],
  262. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述室内场景元素(拱形门洞、藤编家具、自然光影)、色调(温暖奶油色)和风格(地中海/法式复古)直接生成室内效果图,Midjourney v8 或 FLUX.2 [max] 均支持室内设计效果图这类典型场景;CAP-004(风格切换与风格控制)通过风格LoRA或--sref参数精确控制地中海/法式复古风格呈现;CAP-016(生成阶段原生高分辨率输出)确保输出高质感、细节丰富的展示级效果图。",
  263. "match_status": "完全满足",
  264. "needs_research": false,
  265. "research_note": ""
  266. },
  267. {
  268. "requirement_id": "REQ_061",
  269. "requirement_text": "生成具有强烈色彩对比的艺术插画,整体画面以高饱和度的红色与蓝色为主色调,两种颜色形成鲜明的冷暖对撞,背景大面积纯色铺底,视觉冲击力极强",
  270. "source_subtree": {
  271. "parent_node": "色彩强化",
  272. "parent_id": 15896,
  273. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化"
  274. },
  275. "source_nodes": [
  276. "色彩强化",
  277. "对比度调节"
  278. ],
  279. "source_posts": [
  280. "681c64ce000000002200554c",
  281. "684e2d44000000002100cca7",
  282. "68538f7c000000002400805b",
  283. "689b158f000000001b03e512",
  284. "6964be3900000000210282a4",
  285. "6964beb3000000002103361a",
  286. "6968ef250000000021033c7c",
  287. "6969068e000000000d008b48",
  288. "696b537f00000000220398ad",
  289. "696b658e000000001a01d2ef",
  290. "696ede36000000001a028e03",
  291. "6970693f000000002102bec2",
  292. "697069b7000000002202d264",
  293. "69706a0600000000210282bd",
  294. "6971ec6f000000001a02d248",
  295. "6975b361000000002202d7e8",
  296. "697638e8000000001a025711"
  297. ],
  298. "matched_capabilities": [
  299. "CAP-001",
  300. "CAP-004"
  301. ],
  302. "capability_combination": "CAP-001 通过详细提示词描述高饱和度红蓝对比色调、冷暖对撞、大面积纯色背景等视觉要素直接生成目标插画;CAP-004 可通过风格 LoRA 或 --sref 风格参考图进一步强化特定艺术插画风格,确保色彩饱和度和视觉冲击力符合预期。",
  303. "match_status": "完全满足",
  304. "needs_research": false,
  305. "research_note": ""
  306. },
  307. {
  308. "requirement_id": "REQ_062",
  309. "requirement_text": "在以暗色或单色为主的画面中,用局部的高饱和亮色(如红色心脏、橙色暖光窗口、金黄色星光)作为点睛之笔,让视线自然聚焦到这个色彩亮点上,形成强烈的视觉引导",
  310. "source_subtree": {
  311. "parent_node": "色彩强化",
  312. "parent_id": 15896,
  313. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化"
  314. },
  315. "source_nodes": [
  316. "局部点缀",
  317. "色彩强化"
  318. ],
  319. "source_posts": [
  320. "681c64ce000000002200554c",
  321. "684e2d44000000002100cca7",
  322. "68538f7c000000002400805b",
  323. "689b158f000000001b03e512",
  324. "6964be3900000000210282a4",
  325. "6964beb3000000002103361a",
  326. "6968ef250000000021033c7c",
  327. "6969068e000000000d008b48",
  328. "696b537f00000000220398ad",
  329. "696b658e000000001a01d2ef",
  330. "696ede36000000001a028e03",
  331. "6970693f000000002102bec2",
  332. "697069b7000000002202d264",
  333. "69706a0600000000210282bd",
  334. "6971ec6f000000001a02d248",
  335. "6975b361000000002202d7e8",
  336. "697638e8000000001a025711"
  337. ],
  338. "matched_capabilities": [
  339. "CAP-001",
  340. "CAP-004"
  341. ],
  342. "capability_combination": "CAP-001 通过精细提示词描述暗色/单色主基调 + 局部高饱和亮色元素(如红色心脏、橙色窗口、金黄星光)及其位置关系,直接生成具有视觉引导效果的画面;CAP-004 可通过风格参考图或 LoRA 强化特定的明暗对比插画风格,辅助实现局部色彩点缀的艺术效果。",
  343. "match_status": "完全满足",
  344. "needs_research": false,
  345. "research_note": ""
  346. },
  347. {
  348. "requirement_id": "REQ_063",
  349. "requirement_text": "生成整体色调统一、饱和度偏高的场景图,例如全画面笼罩在深蓝色夜光氛围或浓郁的赤红土地色调中,让单一主色调主导整个画面,营造出沉浸式的强烈色彩氛围感",
  350. "source_subtree": {
  351. "parent_node": "色彩强化",
  352. "parent_id": 15896,
  353. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化"
  354. },
  355. "source_nodes": [
  356. "色彩强化",
  357. "对比度调节"
  358. ],
  359. "source_posts": [
  360. "681c64ce000000002200554c",
  361. "684e2d44000000002100cca7",
  362. "68538f7c000000002400805b",
  363. "689b158f000000001b03e512",
  364. "6964be3900000000210282a4",
  365. "6964beb3000000002103361a",
  366. "6968ef250000000021033c7c",
  367. "6969068e000000000d008b48",
  368. "696b537f00000000220398ad",
  369. "696b658e000000001a01d2ef",
  370. "696ede36000000001a028e03",
  371. "6970693f000000002102bec2",
  372. "697069b7000000002202d264",
  373. "69706a0600000000210282bd",
  374. "6971ec6f000000001a02d248",
  375. "6975b361000000002202d7e8",
  376. "697638e8000000001a025711"
  377. ],
  378. "matched_capabilities": [
  379. "CAP-001",
  380. "CAP-004"
  381. ],
  382. "capability_combination": "CAP-001 通过提示词明确描述单一主色调(深蓝夜光/赤红土地)、高饱和度、全画面色调统一等要素,直接生成沉浸式氛围场景图;CAP-004 可通过色调风格 LoRA 或 --sref 风格参考图进一步锁定特定色彩氛围风格,确保主色调在整个画面中的主导性和一致性。",
  383. "match_status": "完全满足",
  384. "needs_research": false,
  385. "research_note": ""
  386. },
  387. {
  388. "requirement_id": "REQ_028",
  389. "requirement_text": "将猫咪表情包图片与各种场景素材(办公室、食物、产品、背景环境等)合成拼贴在一起,让猫咪看起来自然地处于这些场景中,形成多格并排的拼贴版式",
  390. "source_subtree": {
  391. "parent_node": "素材重组",
  392. "parent_id": 15888,
  393. "context_path": "/root/呈现/视觉/影像制作/剪辑组接/素材重组"
  394. },
  395. "source_nodes": [
  396. "拼贴并置",
  397. "混剪重组"
  398. ],
  399. "source_posts": [
  400. "68737e97000000000d027b81",
  401. "68789450000000000b01d4a4",
  402. "688366bd000000000d024147",
  403. "68946e0d000000002500ef6e",
  404. "68a43a11000000001c03cc96",
  405. "68be928b000000001c0361ea",
  406. "68c3933e000000001d00a902",
  407. "68d1ebb8000000001203fd96",
  408. "68d610800000000012023282",
  409. "68d76cd100000000120165e4",
  410. "68e0f5750000000007015ff9",
  411. "68ec9d6400000000070389be",
  412. "68f0b8140000000007008b05",
  413. "68f1b573000000000702052e",
  414. "68fa029e0000000007022932",
  415. "68ff53770000000007000d54"
  416. ],
  417. "matched_capabilities": [
  418. "CAP-020"
  419. ],
  420. "capability_combination": "CAP-020 可将猫咪参考图与场景描述合成,但多格并排拼贴版式布局能力存在缺口。",
  421. "match_status": "需要调研",
  422. "needs_research": true,
  423. "research_note": "CAP-020 可将猫咪图片与场景合成为单张图,CAP-003 可让猫咪在不同场景中保持外观一致。但需求的核心是'多格并排拼贴版式'——即将多张合成结果排列为拼贴画布的版式编排能力,现有原子能力表中没有覆盖图像拼版/画布排列/多图网格布局的能力。需要调研:是否有 AI 工具支持直接生成多格拼贴版式,或是否有图像拼版/排版工具(如 ComfyUI 中的图像拼接节点)可实现多图网格排列输出。"
  424. },
  425. {
  426. "requirement_id": "REQ_029",
  427. "requirement_text": "把猫咪图片与各类装扮道具(帽子、眼镜、服装、假发等)或其他卡通/玩具素材叠加合成,让不同来源的素材无缝融合成一张完整的搞笑图",
  428. "source_subtree": {
  429. "parent_node": "素材重组",
  430. "parent_id": 15888,
  431. "context_path": "/root/呈现/视觉/影像制作/剪辑组接/素材重组"
  432. },
  433. "source_nodes": [
  434. "拼贴并置",
  435. "混剪重组"
  436. ],
  437. "source_posts": [
  438. "68737e97000000000d027b81",
  439. "68789450000000000b01d4a4",
  440. "688366bd000000000d024147",
  441. "68946e0d000000002500ef6e",
  442. "68a43a11000000001c03cc96",
  443. "68be928b000000001c0361ea",
  444. "68c3933e000000001d00a902",
  445. "68d1ebb8000000001203fd96",
  446. "68d610800000000012023282",
  447. "68d76cd100000000120165e4",
  448. "68e0f5750000000007015ff9",
  449. "68ec9d6400000000070389be",
  450. "68f0b8140000000007008b05",
  451. "68f1b573000000000702052e",
  452. "68fa029e0000000007022932",
  453. "68ff53770000000007000d54"
  454. ],
  455. "matched_capabilities": [
  456. "CAP-020",
  457. "CAP-012",
  458. "CAP-003"
  459. ],
  460. "capability_combination": "CAP-020 可将猫咪与道具素材参考图合成到同一画面;CAP-003 可保持猫咪外观特征不变;CAP-012 可对合成结果进行局部修复使边缘融合更自然。",
  461. "match_status": "需要调研",
  462. "needs_research": true,
  463. "research_note": "CAP-020 支持多图合成,CAP-003 可保持猫咪主体一致性,CAP-012 可做局部修复融合。但需求强调'不同来源素材无缝融合'——即将现有的猫咪照片与现有的道具素材图像进行精确叠加合成(类似图层合成/抠图贴合),而非重新生成。现有能力更偏向'生成'而非'精确像素级叠加合成'。需要调研:是否有 AI 工具支持将两张现有图像进行精确的前景/背景分离后叠加合成,以及是否有自动抠图+图层合成的 AI 能力(如 ComfyUI 中的背景移除节点 + 图层合并节点)。"
  464. },
  465. {
  466. "requirement_id": "REQ_030",
  467. "requirement_text": "在同一张图中将多只猫咪或同一只猫咪的不同姿态照片拼接组合,配合文字标注形成对话或对比效果的多格拼图",
  468. "source_subtree": {
  469. "parent_node": "素材重组",
  470. "parent_id": 15888,
  471. "context_path": "/root/呈现/视觉/影像制作/剪辑组接/素材重组"
  472. },
  473. "source_nodes": [
  474. "拼贴并置",
  475. "混剪重组"
  476. ],
  477. "source_posts": [
  478. "68737e97000000000d027b81",
  479. "68789450000000000b01d4a4",
  480. "688366bd000000000d024147",
  481. "68946e0d000000002500ef6e",
  482. "68a43a11000000001c03cc96",
  483. "68be928b000000001c0361ea",
  484. "68c3933e000000001d00a902",
  485. "68d1ebb8000000001203fd96",
  486. "68d610800000000012023282",
  487. "68d76cd100000000120165e4",
  488. "68e0f5750000000007015ff9",
  489. "68ec9d6400000000070389be",
  490. "68f0b8140000000007008b05",
  491. "68f1b573000000000702052e",
  492. "68fa029e0000000007022932",
  493. "68ff53770000000007000d54"
  494. ],
  495. "matched_capabilities": [
  496. "CAP-014",
  497. "CAP-003"
  498. ],
  499. "capability_combination": "CAP-003 可保持猫咪外观一致性;CAP-014 可在图像中渲染文字标注内容;但多格拼图版式编排能力缺失。",
  500. "match_status": "需要调研",
  501. "needs_research": true,
  502. "research_note": "CAP-003 可处理多张猫咪参考图保持一致性,CAP-014 可渲染对话文字/标注文字。但需求核心是'多格拼图'版式——将多张独立照片排列为多格对比/对话版式(类似漫画分格或表情包多格布局),现有原子能力表中没有覆盖多图网格排版/画布拼接的能力。需要调研:是否有 AI 工具或 ComfyUI 节点支持将多张图像自动排列为多格拼图版式,并支持在格间添加文字标注或对话气泡。"
  503. },
  504. {
  505. "requirement_id": "REQ_075",
  506. "requirement_text": "生成具有强烈光影对比的场景图,画面中光源明显(如阳光折射、水面反光、彩虹色光晕),暗部极深、亮部极亮,整体呈现出戏剧性的明暗反差和光线质感",
  507. "source_subtree": {
  508. "parent_node": "光影质感",
  509. "parent_id": 15897,
  510. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感"
  511. },
  512. "source_nodes": [
  513. "后期技法",
  514. "材质纹理"
  515. ],
  516. "source_posts": [
  517. "681c64ce000000002200554c",
  518. "68843a4d000000001c037591",
  519. "696078f70000000022038479",
  520. "696079a10000000022031521",
  521. "6960924b000000001a037a1c",
  522. "6964573a000000000d00800e",
  523. "6964ab0e000000001a035c04",
  524. "696b528900000000210333ea",
  525. "696b52dd000000002202c60a",
  526. "696d7ac4000000000e03e459",
  527. "696ede36000000001a028e03",
  528. "6970693f000000002102bec2",
  529. "697069b7000000002202d264",
  530. "69706a0600000000210282bd",
  531. "697569b0000000001a02448c",
  532. "6975b32c000000002102bc55"
  533. ],
  534. "matched_capabilities": [
  535. "CAP-001"
  536. ],
  537. "capability_combination": "CAP-001(文本到图像生成):通过在提示词中精确描述戏剧性光影效果(如 chiaroscuro、dramatic lighting、god rays、caustics、rainbow lens flare、deep shadows、blown highlights 等专业光影词汇),利用 FLUX.2 [max] 或 Midjourney v8 的照片级真实感生成能力,直接生成具有强烈明暗对比和光线质感的场景图。",
  538. "match_status": "需要调研",
  539. "needs_research": true,
  540. "research_note": "CAP-001 可通过提示词描述光影风格来生成具有一定光影对比的图像,但对于'暗部极深、亮部极亮'的精确曝光控制、彩虹色光晕/水面反光等复杂物理光学效果的精准还原,仅靠文本提示词的控制精度存在不确定性。现有能力表中缺少专项的光照物理渲染控制能力(如 HDR 色调映射控制、光线追踪参数调节)。需要调研:1)各模型对极端明暗对比(HDR 风格)的提示词响应效果;2)是否有专门的光效控制 LoRA 或 ComfyUI 节点(如光线追踪、焦散效果节点)可实现更精准的光影控制。"
  541. },
  542. {
  543. "requirement_id": "REQ_076",
  544. "requirement_text": "生成带有明显颗粒感或纸张纹理的插画风格图片,画面整体像是印刷在粗糙介质上,物体表面有细腻的颗粒噪点或手工绘制的笔触肌理",
  545. "source_subtree": {
  546. "parent_node": "光影质感",
  547. "parent_id": 15897,
  548. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感"
  549. },
  550. "source_nodes": [
  551. "材质纹理",
  552. "后期技法"
  553. ],
  554. "source_posts": [
  555. "681c64ce000000002200554c",
  556. "68843a4d000000001c037591",
  557. "696078f70000000022038479",
  558. "696079a10000000022031521",
  559. "6960924b000000001a037a1c",
  560. "6964573a000000000d00800e",
  561. "6964ab0e000000001a035c04",
  562. "696b528900000000210333ea",
  563. "696b52dd000000002202c60a",
  564. "696d7ac4000000000e03e459",
  565. "696ede36000000001a028e03",
  566. "6970693f000000002102bec2",
  567. "697069b7000000002202d264",
  568. "69706a0600000000210282bd",
  569. "697569b0000000001a02448c",
  570. "6975b32c000000002102bc55"
  571. ],
  572. "matched_capabilities": [
  573. "CAP-001",
  574. "CAP-004"
  575. ],
  576. "capability_combination": "CAP-001(文本到图像生成)+ CAP-004(风格切换与风格控制):使用 CAP-001 生成基础插画内容,同时通过 CAP-004 加载专项风格 LoRA(如 grain texture LoRA、risograph LoRA、screen print LoRA)或在 Midjourney v8 中使用 --sref 上传带颗粒纸张纹理的风格参考图,将整体画面渲染为印刷粗糙介质风格;提示词中补充 film grain、paper texture、risograph、letterpress、hand-drawn brush strokes 等关键词强化效果。",
  577. "match_status": "需要调研",
  578. "needs_research": true,
  579. "research_note": "CAP-001 + CAP-004 组合可以在风格层面生成带颗粒感和笔触肌理的插画,但'细腻的颗粒噪点'和'粗糙介质印刷感'属于后期叠加效果,仅靠生成阶段的提示词和风格 LoRA 可能无法精确控制颗粒密度、纸张纹理强度等参数。现有能力表中缺少专项的后期纹理叠加能力(如将噪点/纸张纹理图层以特定混合模式叠加到生成图像上的 ComfyUI 节点)。需要调研:1)ComfyUI 中是否有图像后期纹理叠加节点(如 Image Blend、Texture Overlay);2)专项颗粒感/印刷风格 LoRA 的可用性和效果;3)是否可通过 img2img 将生成图像与纹理素材合成来精确控制肌理效果。"
  580. },
  581. {
  582. "requirement_id": "REQ_077",
  583. "requirement_text": "生成室内场景时,能真实还原不同材质的质感细节,如木地板的纹路光泽、布艺沙发的绒毛感、大理石茶几的光滑反射、藤编家具的编织纹理等",
  584. "source_subtree": {
  585. "parent_node": "光影质感",
  586. "parent_id": 15897,
  587. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感"
  588. },
  589. "source_nodes": [
  590. "材质纹理"
  591. ],
  592. "source_posts": [
  593. "681c64ce000000002200554c",
  594. "68843a4d000000001c037591",
  595. "696078f70000000022038479",
  596. "696079a10000000022031521",
  597. "6960924b000000001a037a1c",
  598. "6964573a000000000d00800e",
  599. "6964ab0e000000001a035c04",
  600. "696b528900000000210333ea",
  601. "696b52dd000000002202c60a",
  602. "696d7ac4000000000e03e459",
  603. "696ede36000000001a028e03",
  604. "6970693f000000002102bec2",
  605. "697069b7000000002202d264",
  606. "69706a0600000000210282bd",
  607. "697569b0000000001a02448c",
  608. "6975b32c000000002102bc55"
  609. ],
  610. "matched_capabilities": [
  611. "CAP-001",
  612. "CAP-016"
  613. ],
  614. "capability_combination": "CAP-001(文本到图像生成)+ CAP-016(生成阶段原生高分辨率输出):使用 CAP-001 通过详细的材质描述提示词(如 oak wood floor with visible grain and glossy finish、velvet sofa with soft pile texture、polished marble table with reflective surface、rattan weave pattern 等)生成室内场景;结合 CAP-016 使用 Midjourney v8 --hd 参数或 Nano Banana Pro 4K 输出,在高分辨率下确保木纹、绒毛、大理石纹路、藤编等细节清晰可见。",
  615. "match_status": "需要调研",
  616. "needs_research": true,
  617. "research_note": "CAP-001 + CAP-016 组合可以生成具有一定材质质感的高清室内场景,但对于多种不同材质在同一场景中同时精准还原(尤其是绒毛感的微观纤维细节、藤编的精细编织结构、大理石的真实反射高光)存在挑战,单纯依赖提示词描述的控制精度有限。现有能力表中缺少专项的材质 PBR 渲染控制能力。需要调研:1)专项材质 LoRA(木纹、大理石、布料、藤编)在 ComfyUI 中的可用性;2)FLUX.2 [max] 或 Midjourney v8 对复杂多材质室内场景的实际还原效果;3)是否可通过 ControlNet 材质图或法线图输入来增强特定材质的质感表现。"
  618. },
  619. {
  620. "requirement_id": "REQ_085",
  621. "requirement_text": "生成具有统一色调风格的插画场景,整体画面使用高度协调的单一色系(如全蓝紫色调的火车风景、全粉紫色调的奇幻海洋),让画面中所有元素的颜色都偏向同一个色相,营造出梦幻沉浸的视觉氛围",
  622. "source_subtree": {
  623. "parent_node": "饱和度调节",
  624. "parent_id": 15941,
  625. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化/饱和度调节"
  626. },
  627. "source_nodes": [
  628. "单色饱和度",
  629. "饱和度调节"
  630. ],
  631. "source_posts": [
  632. "67bee0df000000002802acd1",
  633. "67e37ff8000000001c008b5e",
  634. "686f606c00000000120167b5",
  635. "689b158f000000001b03e512",
  636. "68b15f32000000001d00ef75",
  637. "68c15181000000001b01c358",
  638. "68e8cac8000000000700da88",
  639. "69002ba70000000007008bcc",
  640. "696078f70000000022038479",
  641. "696079a10000000022031521",
  642. "6964573a000000000d00800e",
  643. "6964be3900000000210282a4",
  644. "696ede36000000001a028e03",
  645. "69756d90000000001a020c81",
  646. "6975b2d7000000002200b4ae",
  647. "6975b3c50000000022020356"
  648. ],
  649. "matched_capabilities": [
  650. "CAP-001",
  651. "CAP-004"
  652. ],
  653. "capability_combination": "CAP-001 通过提示词直接描述目标色调(如'全蓝紫色调'、'monochromatic blue-purple palette')引导生成统一色系画面;CAP-004 可通过风格参考图(--sref)或 LoRA 进一步强化特定色调风格,两者组合可实现单一色系的梦幻插画场景生成",
  654. "match_status": "完全满足",
  655. "needs_research": false,
  656. "research_note": ""
  657. },
  658. {
  659. "requirement_id": "REQ_086",
  660. "requirement_text": "生成色彩鲜艳、多色并置的视觉冲击画面,画面中同时出现多种高饱和度的颜色搭配(如复古拼贴风格中的粉色、蓝色、橙色并置,或彩色条纹波浪地形),让整体色彩浓烈饱满、视觉张力强烈",
  661. "source_subtree": {
  662. "parent_node": "饱和度调节",
  663. "parent_id": 15941,
  664. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化/饱和度调节"
  665. },
  666. "source_nodes": [
  667. "配色饱和度",
  668. "饱和度调节"
  669. ],
  670. "source_posts": [
  671. "67bee0df000000002802acd1",
  672. "67e37ff8000000001c008b5e",
  673. "686f606c00000000120167b5",
  674. "689b158f000000001b03e512",
  675. "68b15f32000000001d00ef75",
  676. "68c15181000000001b01c358",
  677. "68e8cac8000000000700da88",
  678. "69002ba70000000007008bcc",
  679. "696078f70000000022038479",
  680. "696079a10000000022031521",
  681. "6964573a000000000d00800e",
  682. "6964be3900000000210282a4",
  683. "696ede36000000001a028e03",
  684. "69756d90000000001a020c81",
  685. "6975b2d7000000002200b4ae",
  686. "6975b3c50000000022020356"
  687. ],
  688. "matched_capabilities": [
  689. "CAP-001",
  690. "CAP-004"
  691. ],
  692. "capability_combination": "CAP-001 通过提示词明确描述多种高饱和度颜色组合(如'vibrant pink, blue, orange, highly saturated, bold color palette')及风格关键词(如'retro collage'、'colorful stripes')直接引导生成高饱和多色画面;CAP-004 可通过风格参考图或 LoRA 强化复古拼贴等特定高饱和风格,两者组合可实现视觉张力强烈的多色并置效果",
  693. "match_status": "完全满足",
  694. "needs_research": false,
  695. "research_note": ""
  696. },
  697. {
  698. "requirement_id": "REQ_087",
  699. "requirement_text": "生成低饱和度或去色风格的极简画面,整体色彩纯度降低,呈现出克制、安静的视觉质感(如黑白灰调的海洋孤舟场景,或接近无彩色的素雅插画),与高饱和度画面形成鲜明对比",
  700. "source_subtree": {
  701. "parent_node": "饱和度调节",
  702. "parent_id": 15941,
  703. "context_path": "/root/呈现/视觉/视觉气质/色彩调性/色彩强化/饱和度调节"
  704. },
  705. "source_nodes": [
  706. "单色饱和度",
  707. "配色饱和度"
  708. ],
  709. "source_posts": [
  710. "67bee0df000000002802acd1",
  711. "67e37ff8000000001c008b5e",
  712. "686f606c00000000120167b5",
  713. "689b158f000000001b03e512",
  714. "68b15f32000000001d00ef75",
  715. "68c15181000000001b01c358",
  716. "68e8cac8000000000700da88",
  717. "69002ba70000000007008bcc",
  718. "696078f70000000022038479",
  719. "696079a10000000022031521",
  720. "6964573a000000000d00800e",
  721. "6964be3900000000210282a4",
  722. "696ede36000000001a028e03",
  723. "69756d90000000001a020c81",
  724. "6975b2d7000000002200b4ae",
  725. "6975b3c50000000022020356"
  726. ],
  727. "matched_capabilities": [
  728. "CAP-001",
  729. "CAP-004"
  730. ],
  731. "capability_combination": "CAP-001 通过提示词描述低饱和度或去色风格(如'desaturated, monochrome, black and white, muted tones, minimalist')引导生成极简低饱和画面;CAP-004 可通过风格参考图(--sref)或黑白/素雅风格 LoRA 进一步精确控制去色程度和极简视觉质感,两者组合可稳定实现低饱和度插画效果",
  732. "match_status": "完全满足",
  733. "needs_research": false,
  734. "research_note": ""
  735. },
  736. {
  737. "requirement_id": "REQ_046",
  738. "requirement_text": "制作图文卡片式科普内容:每张卡片包含统一的标题样式、编号序列、配套插图(卡通/示意图风格)和说明文字,多张卡片拼成一组,整体风格统一、排版清晰,适合健康养生、步骤教程类内容展示",
  739. "source_subtree": {
  740. "parent_node": "标注图示",
  741. "parent_id": 15886,
  742. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示"
  743. },
  744. "source_nodes": [
  745. "图示说明",
  746. "标注图示"
  747. ],
  748. "source_posts": [
  749. "669b52720000000025003596",
  750. "672de546000000001b02cfeb",
  751. "6732f52f000000001b013fdb",
  752. "6735b1a0000000001b0137f5",
  753. "673d9a58000000000702450b",
  754. "67e224cc000000000602a6c5",
  755. "67e27e6e000000000b017c96",
  756. "6810596c000000002301d1a6",
  757. "68f9e8400000000005033268",
  758. "69048be90000000005033c79",
  759. "69200dec000000001f00b884",
  760. "692e7ccf000000001f00a137",
  761. "69394a0b000000001f006ce6",
  762. "694a6caf000000001f00e112"
  763. ],
  764. "matched_capabilities": [
  765. "CAP-001",
  766. "CAP-004",
  767. "CAP-014"
  768. ],
  769. "capability_combination": "CAP-001 生成卡通/示意图风格的配套插图;CAP-004 通过风格控制保证多张卡片插图风格统一;CAP-014 在图像中渲染标题文字和说明文字。但三者组合仍无法解决:多张卡片的统一排版布局(编号序列、标题样式、文字与插图的精确位置关系)、多卡片拼合为一组的版式设计,这些属于图文排版合成能力,超出现有原子能力范围。",
  770. "match_status": "需要调研",
  771. "needs_research": true,
  772. "research_note": "现有能力可以生成单张卡通风格插图(CAP-001)、控制风格统一性(CAP-004)、在图像内渲染文字(CAP-014),但缺少以下关键能力:1)多元素精确排版布局能力——将标题、编号、插图、说明文字按固定模板精确排列在卡片内;2)多卡片批量生成并保持版式一致性的模板化能力;3)将多张卡片拼合为一组长图/组图的图像合成排版能力。需要调研是否有支持模板化图文排版合成的AI工具(如支持固定版式的图文生成工具),或是否需要结合设计工具(如Canva API、Adobe Express等)实现排版部分。"
  773. },
  774. {
  775. "requirement_id": "REQ_047",
  776. "requirement_text": "制作数据报告类图文内容:包含柱状图、饼图、折线图、词云图、环形图等多种数据可视化图表,配合标题、要点文字说明,整体呈现专业研究报告的视觉风格,色彩搭配统一(如蓝紫色系或橙色系)",
  777. "source_subtree": {
  778. "parent_node": "标注图示",
  779. "parent_id": 15886,
  780. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示"
  781. },
  782. "source_nodes": [
  783. "图示说明",
  784. "标注图示"
  785. ],
  786. "source_posts": [
  787. "669b52720000000025003596",
  788. "672de546000000001b02cfeb",
  789. "6732f52f000000001b013fdb",
  790. "6735b1a0000000001b0137f5",
  791. "673d9a58000000000702450b",
  792. "67e224cc000000000602a6c5",
  793. "67e27e6e000000000b017c96",
  794. "6810596c000000002301d1a6",
  795. "68f9e8400000000005033268",
  796. "69048be90000000005033c79",
  797. "69200dec000000001f00b884",
  798. "692e7ccf000000001f00a137",
  799. "69394a0b000000001f006ce6",
  800. "694a6caf000000001f00e112"
  801. ],
  802. "matched_capabilities": [
  803. "CAP-013",
  804. "CAP-014"
  805. ],
  806. "capability_combination": "CAP-013 可通过实时联网获取真实数据并生成信息图表类图像;CAP-014 可在图像中渲染标题和文字说明。但核心问题在于:AI图像生成工具生成的图表是'看起来像图表的图像',而非基于真实数据精确绘制的数据可视化图表,数值、比例、刻度均不可靠,无法满足专业数据报告的准确性要求。",
  807. "match_status": "需要调研",
  808. "needs_research": true,
  809. "research_note": "现有AI图像生成能力(CAP-001、CAP-014)可以生成'外观像数据报告'的图像,CAP-013可融合实时数据,但存在根本性缺陷:AI生成的柱状图、饼图、折线图等图表中的数据比例、数值标注、坐标轴刻度均为视觉近似,不能保证数据准确性,不适合真实数据报告场景。需要调研:1)是否有AI工具支持输入真实数据后生成精确的数据可视化图表(如基于代码生成图表的AI工具);2)是否可通过代码生成方式(Python matplotlib/echarts等)结合AI进行风格美化来实现;3)若需求仅为'视觉风格展示'而非真实数据,则CAP-001+CAP-014组合可部分满足外观需求,但需明确需求方对数据准确性的要求。"
  810. },
  811. {
  812. "requirement_id": "REQ_048",
  813. "requirement_text": "制作流程图/架构示意图:用箭头、方框、层级结构或立体堆叠图形展示系统架构、业务流程或概念层级关系,配合文字标注说明各模块功能,视觉上清晰呈现逻辑关系",
  814. "source_subtree": {
  815. "parent_node": "标注图示",
  816. "parent_id": 15886,
  817. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示"
  818. },
  819. "source_nodes": [
  820. "图示说明",
  821. "标注图示"
  822. ],
  823. "source_posts": [
  824. "669b52720000000025003596",
  825. "672de546000000001b02cfeb",
  826. "6732f52f000000001b013fdb",
  827. "6735b1a0000000001b0137f5",
  828. "673d9a58000000000702450b",
  829. "67e224cc000000000602a6c5",
  830. "67e27e6e000000000b017c96",
  831. "6810596c000000002301d1a6",
  832. "68f9e8400000000005033268",
  833. "69048be90000000005033c79",
  834. "69200dec000000001f00b884",
  835. "692e7ccf000000001f00a137",
  836. "69394a0b000000001f006ce6",
  837. "694a6caf000000001f00e112"
  838. ],
  839. "matched_capabilities": [
  840. "CAP-001",
  841. "CAP-014"
  842. ],
  843. "capability_combination": "CAP-001 可生成外观上类似流程图/架构图的图像;CAP-014 可在图像中渲染文字标注。但AI图像生成工具无法保证箭头指向逻辑正确、方框层级关系准确、各模块文字标注与对应图形精确对应,生成结果在逻辑结构准确性上不可控。",
  844. "match_status": "需要调研",
  845. "needs_research": true,
  846. "research_note": "现有AI图像生成能力可以生成'外观像流程图'的图像,但存在根本性问题:1)逻辑结构准确性无法保证——箭头连接关系、层级从属关系、模块间逻辑流向均由模型视觉生成,不能保证与需求描述的逻辑一致;2)文字标注与图形元素的精确对应关系难以控制——CAP-014虽能渲染文字,但无法保证文字精确出现在对应方框内;3)复杂架构图(多层级、多分支)的结构完整性难以通过提示词精确控制。需要调研:1)是否有AI工具支持通过结构化描述(如JSON/YAML/自然语言)生成逻辑准确的流程图/架构图(如基于Mermaid、PlantUML的AI生成工具);2)是否有图表生成类AI工具(如Eraser AI、Whimsical AI等)可满足此需求;3)若需求侧重视觉美化而非逻辑准确性,CAP-001+CAP-014可满足外观需求。"
  847. },
  848. {
  849. "requirement_id": "REQ_007",
  850. "requirement_text": "生成真实人物在户外或特定场景中的生活记录照片,画面自然真实,包含儿童在公园、农场等户外环境中玩耍的多角度抓拍效果,光线自然,氛围温馨",
  851. "source_subtree": {
  852. "parent_node": "实景拍摄",
  853. "parent_id": 15908,
  854. "context_path": "/root/呈现/视觉/影像制作/实景拍摄"
  855. },
  856. "source_nodes": [
  857. "拍摄概述",
  858. "实景拍摄"
  859. ],
  860. "source_posts": [
  861. "67316440000000001b02e75e",
  862. "675c19320000000002017d1f",
  863. "6776b27d0000000013018545",
  864. "67b2a7f7000000002802a0d7",
  865. "682ede8f000000002202bff2",
  866. "685f974300000000120144db",
  867. "6911532d000000000503bd18",
  868. "691d3112000000001e036559",
  869. "692d3b99000000001e022295",
  870. "692fa7e0000000001e039786",
  871. "693d0b1d000000001e02ba36",
  872. "69535514000000001e032b26",
  873. "69672e2d000000001a026263"
  874. ],
  875. "matched_capabilities": [
  876. "CAP-001",
  877. "CAP-003"
  878. ],
  879. "capability_combination": "CAP-001 负责根据提示词生成户外场景中儿童玩耍的照片级真实感图像(FLUX.2 [max] 或 Nano Banana Pro 均支持照片级真实感输出,可描述公园/农场场景、自然光线、温馨氛围);若需要保持特定儿童人物外观一致性,可结合 CAP-003 上传参考图保持人物特征;多角度抓拍效果可通过多次生成不同构图角度的提示词实现",
  880. "match_status": "需要调研",
  881. "needs_research": true,
  882. "research_note": "CAP-001 可生成照片级真实感的户外儿童场景图像,CAP-003 可保持特定人物外观一致性。但核心问题在于:需求强调的是'真实人物'的生活记录照片,即基于真实存在的特定儿童人物进行场景生成,这涉及真实人脸的高度还原与多角度一致性保持。现有 CAP-003 虽支持角色一致性,但对真实儿童人脸在多角度自然抓拍场景下的还原精度是否足够,以及是否存在伦理/合规限制(真实儿童人脸生成),需要进一步调研各工具的实际表现和使用限制。"
  883. },
  884. {
  885. "requirement_id": "REQ_008",
  886. "requirement_text": "制作将真实人物照片合成到趣味场景中的创意图片,例如把人物缩小放入超市肉类托盘包装内、或与冰雕翅膀等道具结合形成视觉错位的幽默效果",
  887. "source_subtree": {
  888. "parent_node": "实景拍摄",
  889. "parent_id": 15908,
  890. "context_path": "/root/呈现/视觉/影像制作/实景拍摄"
  891. },
  892. "source_nodes": [
  893. "拍摄概述",
  894. "实景拍摄"
  895. ],
  896. "source_posts": [
  897. "67316440000000001b02e75e",
  898. "675c19320000000002017d1f",
  899. "6776b27d0000000013018545",
  900. "67b2a7f7000000002802a0d7",
  901. "682ede8f000000002202bff2",
  902. "685f974300000000120144db",
  903. "6911532d000000000503bd18",
  904. "691d3112000000001e036559",
  905. "692d3b99000000001e022295",
  906. "692fa7e0000000001e039786",
  907. "693d0b1d000000001e02ba36",
  908. "69535514000000001e032b26",
  909. "69672e2d000000001a026263"
  910. ],
  911. "matched_capabilities": [
  912. "CAP-020",
  913. "CAP-003",
  914. "CAP-001",
  915. "CAP-012"
  916. ],
  917. "capability_combination": "CAP-020 支持将真实人物参考图与场景合成(如将人物放入超市托盘场景);CAP-003 保持人物外观特征一致性;CAP-001 生成趣味背景场景(超市托盘包装、冰雕翅膀等);CAP-012 可对合成结果进行局部调整修复,使人物与场景融合更自然",
  918. "match_status": "需要调研",
  919. "needs_research": true,
  920. "research_note": "现有能力组合(CAP-020 + CAP-003 + CAP-001 + CAP-012)可以实现将人物参考图合成到新场景中、保持人物外观,并对合成结果进行局部调整修复。但该需求的核心难点在于:1)视觉错位/比例操控(人物缩小放入托盘)需要精确控制人物与场景的相对比例和透视关系,现有能力表中没有明确支持'比例/透视精确控制合成'的能力;2)真实人物照片的高保真合成(非卡通/插画风格)在复杂错位场景中的融合自然度是否达标;3)冰雕翅膀等道具与人物的光影融合效果。需要调研 Nano Banana Pro 或 FLUX.2 [max] 在复杂比例错位合成场景下的实际表现,以及是否有专项的图像合成/抠图工具可配合使用。"
  921. },
  922. {
  923. "requirement_id": "REQ_009",
  924. "requirement_text": "生成真实场景的多图拼贴展示图,将同一地点或主题的多张实拍照片拼合为一张图文并茂的内容图,适合用于地点打卡、产品展示或生活记录类帖子",
  925. "source_subtree": {
  926. "parent_node": "实景拍摄",
  927. "parent_id": 15908,
  928. "context_path": "/root/呈现/视觉/影像制作/实景拍摄"
  929. },
  930. "source_nodes": [
  931. "拍摄概述",
  932. "实景拍摄"
  933. ],
  934. "source_posts": [
  935. "67316440000000001b02e75e",
  936. "675c19320000000002017d1f",
  937. "6776b27d0000000013018545",
  938. "67b2a7f7000000002802a0d7",
  939. "682ede8f000000002202bff2",
  940. "685f974300000000120144db",
  941. "6911532d000000000503bd18",
  942. "691d3112000000001e036559",
  943. "692d3b99000000001e022295",
  944. "692fa7e0000000001e039786",
  945. "693d0b1d000000001e02ba36",
  946. "69535514000000001e032b26",
  947. "69672e2d000000001a026263"
  948. ],
  949. "matched_capabilities": [
  950. "CAP-001",
  951. "CAP-014"
  952. ],
  953. "capability_combination": "CAP-001 可生成单张照片级真实感场景图像作为拼贴素材;CAP-014 可在图像中嵌入文字说明(地点标注、标题等)实现图文并茂效果",
  954. "match_status": "需要调研",
  955. "needs_research": true,
  956. "research_note": "现有能力表中缺少专项的'多图拼贴排版合成'能力。该需求的核心是将多张图片按照特定版式(九宫格、横排、杂志风等)拼合为一张展示图,并添加文字说明。CAP-001 只能生成单张图像,CAP-014 支持图内文字渲染,但两者组合无法实现多图拼贴排版的核心功能。需要调研:1)是否有 AI 工具支持输入多张图片并自动生成拼贴排版图;2)Nano Banana Pro 的多图输入能力(CAP-020 相关)是否可以用于拼贴排版场景;3)是否需要结合 Canva、Photoshop 等设计工具完成排版,而非纯 AI 生成工具。"
  957. },
  958. {
  959. "requirement_id": "REQ_037",
  960. "requirement_text": "生成同一人物在同一场景中多角度、多姿态的即时抓拍效果图,画面呈现自然随意的动态感,如行走、转身、低头、仰望等非摆拍状态,整体风格真实生活化",
  961. "source_subtree": {
  962. "parent_node": "拍摄方式",
  963. "parent_id": 15892,
  964. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/拍摄方式"
  965. },
  966. "source_nodes": [
  967. "即时捕捉",
  968. "拍摄方式"
  969. ],
  970. "source_posts": [
  971. "68077d02000000001c02dd81",
  972. "69003bb30000000004015797",
  973. "691acd15000000000402134e",
  974. "693f94d80000000019025898",
  975. "6964d4bf000000001a031a54",
  976. "6965d491000000000e00f9b0",
  977. "6969068e000000000d008b48",
  978. "696b658e000000001a01d2ef",
  979. "6971878d000000001a01e6cc",
  980. "697638e8000000001a025711"
  981. ],
  982. "matched_capabilities": [
  983. "CAP-001",
  984. "CAP-003",
  985. "CAP-002"
  986. ],
  987. "capability_combination": "CAP-003(图像主体一致性保持)确保同一人物在多张图中外观一致;CAP-002(结构/姿态控制生成)通过OpenPose骨架控制行走、转身、低头、仰望等不同姿态;CAP-001(文本到图像生成)通过提示词描述抓拍风格、真实生活化氛围和场景",
  988. "match_status": "需要调研",
  989. "needs_research": true,
  990. "research_note": "现有能力可以做到:用CAP-003保持人物一致性、用CAP-002控制姿态、用CAP-001描述抓拍风格。但核心缺口在于'即时抓拍/非摆拍'的视觉质感——包括运动模糊、随机构图偏移、快门感、画面轻微倾斜等模拟真实抓拍的视觉特征,现有能力表中没有明确支持此类摄影风格模拟的能力。需要调研:1)主流AI图像生成工具是否支持通过提示词或参数模拟抓拍/街拍摄影风格(如运动模糊、随机构图);2)ComfyUI是否有专门的运动模糊或摄影风格LoRA可实现此效果"
  991. },
  992. {
  993. "requirement_id": "REQ_038",
  994. "requirement_text": "生成动物(如马)在运动瞬间被捕捉的高动态画面,鬃毛飞扬、肢体伸展,呈现出强烈的瞬间张力和动感,背景简洁以突出主体动态",
  995. "source_subtree": {
  996. "parent_node": "拍摄方式",
  997. "parent_id": 15892,
  998. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/拍摄方式"
  999. },
  1000. "source_nodes": [
  1001. "即时捕捉",
  1002. "拍摄方式"
  1003. ],
  1004. "source_posts": [
  1005. "68077d02000000001c02dd81",
  1006. "69003bb30000000004015797",
  1007. "691acd15000000000402134e",
  1008. "693f94d80000000019025898",
  1009. "6964d4bf000000001a031a54",
  1010. "6965d491000000000e00f9b0",
  1011. "6969068e000000000d008b48",
  1012. "696b658e000000001a01d2ef",
  1013. "6971878d000000001a01e6cc",
  1014. "697638e8000000001a025711"
  1015. ],
  1016. "matched_capabilities": [
  1017. "CAP-001"
  1018. ],
  1019. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述马匹运动瞬间、鬃毛飞扬、肢体伸展、简洁背景等视觉要素,利用FLUX.2 [max]或Midjourney v8的照片级写实能力生成高动态画面。",
  1020. "match_status": "需要调研",
  1021. "needs_research": true,
  1022. "research_note": "现有能力可以做到:用CAP-001通过提示词描述马匹运动瞬间的视觉特征(鬃毛飞扬、肢体伸展、简洁背景),FLUX.2 [max]和Midjourney v8的写实能力可生成较高质量的动物动态图。但核心缺口在于:1)'高动态瞬间张力'涉及运动模糊、动态拖影等物理摄影效果,现有能力表未明确说明哪个工具能精准控制这类动态摄影效果;2)动物姿态的精准控制(如特定奔跑步态、肢体伸展角度)——CAP-002的姿态控制主要针对人物OpenPose,对动物姿态控制的支持情况未在能力表中说明。需要调研:AI图像生成工具对动物运动姿态的控制能力,以及模拟高速摄影动态效果的实现方式。"
  1023. },
  1024. {
  1025. "requirement_id": "REQ_039",
  1026. "requirement_text": "生成人物在真实日常场景(街头、公园、机场等)中被随手拍下的多张图片拼贴效果,画面构图不刻意、视角多变(含俯拍脚部、镜中自拍、远景抓拍等),整体呈现出碎片化的生活记录感",
  1027. "source_subtree": {
  1028. "parent_node": "拍摄方式",
  1029. "parent_id": 15892,
  1030. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/拍摄方式"
  1031. },
  1032. "source_nodes": [
  1033. "即时捕捉",
  1034. "拍摄方式"
  1035. ],
  1036. "source_posts": [
  1037. "68077d02000000001c02dd81",
  1038. "69003bb30000000004015797",
  1039. "691acd15000000000402134e",
  1040. "693f94d80000000019025898",
  1041. "6964d4bf000000001a031a54",
  1042. "6965d491000000000e00f9b0",
  1043. "6969068e000000000d008b48",
  1044. "696b658e000000001a01d2ef",
  1045. "6971878d000000001a01e6cc",
  1046. "697638e8000000001a025711"
  1047. ],
  1048. "matched_capabilities": [
  1049. "CAP-001",
  1050. "CAP-003"
  1051. ],
  1052. "capability_combination": "CAP-003(图像主体一致性保持)确保多张拼贴图中同一人物外观一致;CAP-001(文本到图像生成)通过提示词分别描述不同场景(街头/公园/机场)和不同视角(俯拍脚部/镜中自拍/远景抓拍)生成多张单图;拼贴排版需额外处理",
  1053. "match_status": "需要调研",
  1054. "needs_research": true,
  1055. "research_note": "现有能力可以做到:用CAP-003+CAP-001生成多张保持人物一致性的不同场景、不同视角单图。但存在两个核心缺口:1)'多张图片拼贴效果'——将多张图像排列为拼贴版式(如照片墙、胶片条、随机散落感)是一种图像合成/排版能力,现有能力表中没有明确的拼贴版式生成能力;2)'碎片化生活记录感'的视觉质感——包括随机构图、画面倾斜、边缘暗角、胶片颗粒等模拟随手拍的风格特征,能力表未明确支持。需要调研:1)AI图像生成工具是否支持直接生成多图拼贴版式效果(如在单张图像中呈现多张照片拼贴的视觉效果);2)模拟随手拍/生活记录风格的提示词策略或专用LoRA/风格模型是否存在"
  1056. },
  1057. {
  1058. "requirement_id": "REQ_067",
  1059. "requirement_text": "生成具有强烈视觉冲击力的超现实主义风格图像:画面以大地色系(深红、赭石、深蓝)为主调,将白马、牛仔等元素置于极简的荒漠/盐湖场景中,营造出孤寂、神秘、如油画般的电影感氛围",
  1060. "source_subtree": {
  1061. "parent_node": "艺术风格",
  1062. "parent_id": 15889,
  1063. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格"
  1064. },
  1065. "source_nodes": [
  1066. "视觉冲击",
  1067. "绘画艺术"
  1068. ],
  1069. "source_posts": [
  1070. "648d8edf0000000011013447",
  1071. "65eea166000000000d00c6d8",
  1072. "661dbf91000000001a0119b6",
  1073. "669b52720000000025003596",
  1074. "677b5460000000000b00d33e",
  1075. "686cd3a5000000000d0180b0",
  1076. "68a4107f000000001c00e8e9",
  1077. "68f9e8400000000005033268",
  1078. "692a535f0000000019026d5b",
  1079. "6960924b000000001a037a1c"
  1080. ],
  1081. "matched_capabilities": [
  1082. "CAP-001",
  1083. "CAP-004"
  1084. ],
  1085. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述超现实主义风格、大地色系色调、白马牛仔荒漠场景等内容生成基础图像;CAP-004(风格切换与风格控制)通过加载油画/超现实主义风格LoRA或使用Midjourney --sref参数引导整体视觉风格,确保电影感油画氛围的精准呈现。两者组合可完整实现该需求。",
  1086. "match_status": "完全满足",
  1087. "needs_research": false,
  1088. "research_note": ""
  1089. },
  1090. {
  1091. "requirement_id": "REQ_068",
  1092. "requirement_text": "生成3D卡通风格的拟人化动物角色,角色具有毛绒质感和丰富的表情神态,能够在不同生活场景(办公室、卧室、户外)中呈现出喜怒哀乐等情绪状态,整体风格类似皮克斯动画",
  1093. "source_subtree": {
  1094. "parent_node": "艺术风格",
  1095. "parent_id": 15889,
  1096. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格"
  1097. },
  1098. "source_nodes": [
  1099. "绘画艺术",
  1100. "视觉冲击"
  1101. ],
  1102. "source_posts": [
  1103. "648d8edf0000000011013447",
  1104. "65eea166000000000d00c6d8",
  1105. "661dbf91000000001a0119b6",
  1106. "669b52720000000025003596",
  1107. "677b5460000000000b00d33e",
  1108. "686cd3a5000000000d0180b0",
  1109. "68a4107f000000001c00e8e9",
  1110. "68f9e8400000000005033268",
  1111. "692a535f0000000019026d5b",
  1112. "6960924b000000001a037a1c"
  1113. ],
  1114. "matched_capabilities": [
  1115. "CAP-001",
  1116. "CAP-004",
  1117. "CAP-003"
  1118. ],
  1119. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述3D卡通风格、毛绒质感、皮克斯风格拟人化动物角色生成基础图像;CAP-004(风格切换与风格控制)通过加载皮克斯/3D卡通风格LoRA确保风格一致性;CAP-003(图像主体一致性保持)使用IP-Adapter或--cref参数,在切换不同场景(办公室/卧室/户外)和不同表情时保持角色外观特征一致。三者组合可完整实现该需求。",
  1120. "match_status": "完全满足",
  1121. "needs_research": false,
  1122. "research_note": ""
  1123. },
  1124. {
  1125. "requirement_id": "REQ_069",
  1126. "requirement_text": "制作融合插画风格的信息图文海报:以卡通机器人/科技感插图作为视觉主体,搭配醒目的彩色标题文字和数据图表,整体呈现出活泼又专业的视觉效果",
  1127. "source_subtree": {
  1128. "parent_node": "艺术风格",
  1129. "parent_id": 15889,
  1130. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格"
  1131. },
  1132. "source_nodes": [
  1133. "绘画艺术",
  1134. "极简风格"
  1135. ],
  1136. "source_posts": [
  1137. "648d8edf0000000011013447",
  1138. "65eea166000000000d00c6d8",
  1139. "661dbf91000000001a0119b6",
  1140. "669b52720000000025003596",
  1141. "677b5460000000000b00d33e",
  1142. "686cd3a5000000000d0180b0",
  1143. "68a4107f000000001c00e8e9",
  1144. "68f9e8400000000005033268",
  1145. "692a535f0000000019026d5b",
  1146. "6960924b000000001a037a1c"
  1147. ],
  1148. "matched_capabilities": [
  1149. "CAP-001",
  1150. "CAP-004",
  1151. "CAP-014"
  1152. ],
  1153. "capability_combination": "CAP-001(文本到图像生成)通过提示词生成卡通机器人/科技感插画风格的视觉主体;CAP-004(风格切换与风格控制)通过LoRA或风格参数确保插画风格的一致性和活泼专业感;CAP-014(图像内文字渲染)在生成图像中嵌入清晰可读的彩色标题文字。但数据图表部分(如柱状图、折线图等精确数据可视化元素)在现有能力中缺乏专项支持,AI图像生成对精确数据图表的还原度和准确性存在不确定性。",
  1154. "match_status": "需要调研",
  1155. "needs_research": true,
  1156. "research_note": "现有能力可以实现:插画风格卡通机器人主体生成(CAP-001+CAP-004)、标题文字渲染(CAP-014)。缺少的是:精确数据图表(柱状图、饼图、折线图等)的生成能力——AI图像生成工具对精确数值可视化的支持较弱,图表中的数字、刻度、比例可能不准确。需要调研:1)是否有AI工具能在图像中生成精确的数据图表元素;2)是否可以通过CAP-013(实时语境融合)结合数据生成准确图表;3)或者是否需要结合外部图表生成工具(如代码生成图表后与AI插画合成)来完整实现该需求。"
  1157. },
  1158. {
  1159. "requirement_id": "REQ_049",
  1160. "requirement_text": "将整个帖子内容拆分为多个独立小格子并排列成网格或矩阵布局,每个格子承载一个独立的场景或信息单元,格子之间有明显的分隔边界,整体看起来像一张由多张小图拼合而成的大图",
  1161. "source_subtree": {
  1162. "parent_node": "版面结构",
  1163. "parent_id": 15382,
  1164. "context_path": "/root/呈现/视觉/构图编排/版面设计/版面结构"
  1165. },
  1166. "source_nodes": [
  1167. "空间分割",
  1168. "内容组织",
  1169. "载体类型"
  1170. ],
  1171. "source_posts": [
  1172. "65eea166000000000d00c6d8",
  1173. "669b52720000000025003596",
  1174. "6711d712000000001b012783",
  1175. "6731b884000000001901b8d3",
  1176. "677b5460000000000b00d33e",
  1177. "68789450000000000b01d4a4",
  1178. "68a8241a000000001c011403",
  1179. "68e6ecb90000000003021e34",
  1180. "6960924b000000001a037a1c"
  1181. ],
  1182. "matched_capabilities": [
  1183. "CAP-001"
  1184. ],
  1185. "capability_combination": "CAP-001 可以通过提示词描述网格/矩阵布局来生成包含多格子分割的图像,但这属于对构图的语义描述,生成结果的精确性和可控性存疑",
  1186. "match_status": "需要调研",
  1187. "needs_research": true,
  1188. "research_note": "现有能力中 CAP-001 可通过提示词尝试生成网格布局图像,CAP-002 可通过结构控制约束构图,但两者均无法精确控制格子数量、边界粗细、每格内容的独立性和精确排列。核心缺口是:没有专门的版式/排版控制能力,无法像设计软件那样精确定义网格结构。需要调研:1)是否有 AI 工具支持精确的网格版式生成(如指定 3x3、2x4 等格数);2)是否可通过图像拼接后处理工具(非 AI 生成)实现,再结合 AI 生成各格内容;3)ComfyUI 是否有专门的图像拼接/网格排列节点"
  1189. },
  1190. {
  1191. "requirement_id": "REQ_050",
  1192. "requirement_text": "在同一张图中混合使用多种内容载体形式,例如将真实照片、插画角色、产品图、文字说明、图表等不同类型的视觉元素组合排布在同一个版面内,形成图文混排的丰富视觉层次",
  1193. "source_subtree": {
  1194. "parent_node": "版面结构",
  1195. "parent_id": 15382,
  1196. "context_path": "/root/呈现/视觉/构图编排/版面设计/版面结构"
  1197. },
  1198. "source_nodes": [
  1199. "载体类型",
  1200. "内容组织"
  1201. ],
  1202. "source_posts": [
  1203. "65eea166000000000d00c6d8",
  1204. "669b52720000000025003596",
  1205. "6711d712000000001b012783",
  1206. "6731b884000000001901b8d3",
  1207. "677b5460000000000b00d33e",
  1208. "68789450000000000b01d4a4",
  1209. "68a8241a000000001c011403",
  1210. "68e6ecb90000000003021e34",
  1211. "6960924b000000001a037a1c"
  1212. ],
  1213. "matched_capabilities": [
  1214. "CAP-001",
  1215. "CAP-014",
  1216. "CAP-020"
  1217. ],
  1218. "capability_combination": "CAP-001 可生成包含多种视觉元素的图像,CAP-014 可在图像中嵌入文字说明,CAP-020 可将多个主体合成到同一场景;三者组合可部分实现图文混排效果",
  1219. "match_status": "需要调研",
  1220. "needs_research": true,
  1221. "research_note": "现有能力可以:通过 CAP-001 生成混合风格图像、通过 CAP-014 嵌入文字、通过 CAP-020 合成多主体。但核心缺口是:1)无法精确控制不同类型视觉元素(照片风格 vs 插画风格 vs 图表)在同一画面中的独立性和精确位置排布;2)图表类元素(柱状图、折线图等)的精确生成能力不明确;3)版面排布的精确控制(指定某区域放产品图、某区域放文字说明)超出现有提示词控制的精度范围。需要调研:是否有 AI 工具支持分区域指定不同内容类型的版面合成能力,或是否需要结合设计工具(如 Canva、Figma)进行后期排版"
  1222. },
  1223. {
  1224. "requirement_id": "REQ_051",
  1225. "requirement_text": "以统一的视觉主角(如同一个卡通角色、同一个人物、同一主题场景)贯穿多个分格画面,每个格子呈现该主角在不同场景或状态下的样子,配合文字说明形成系列感强的多格叙事版式",
  1226. "source_subtree": {
  1227. "parent_node": "版面结构",
  1228. "parent_id": 15382,
  1229. "context_path": "/root/呈现/视觉/构图编排/版面设计/版面结构"
  1230. },
  1231. "source_nodes": [
  1232. "内容组织",
  1233. "空间分割"
  1234. ],
  1235. "source_posts": [
  1236. "65eea166000000000d00c6d8",
  1237. "669b52720000000025003596",
  1238. "6711d712000000001b012783",
  1239. "6731b884000000001901b8d3",
  1240. "677b5460000000000b00d33e",
  1241. "68789450000000000b01d4a4",
  1242. "68a8241a000000001c011403",
  1243. "68e6ecb90000000003021e34",
  1244. "6960924b000000001a037a1c"
  1245. ],
  1246. "matched_capabilities": [
  1247. "CAP-003",
  1248. "CAP-014",
  1249. "CAP-001"
  1250. ],
  1251. "capability_combination": "CAP-003 保持主角在不同场景中的外观一致性,CAP-001 生成各格不同场景内容,CAP-014 在图像中嵌入文字说明;但多格叙事版式的整体排版合成仍是缺口",
  1252. "match_status": "需要调研",
  1253. "needs_research": true,
  1254. "research_note": "现有能力可以:通过 CAP-003(IP-Adapter/--cref/多图参考)保持主角跨场景一致性,通过 CAP-001 生成各场景图像,通过 CAP-014 添加文字说明。但核心缺口是:1)将多张独立生成的分格图像拼合为统一的多格叙事版式(含分隔边界、文字区域、整体排版)的能力不在现有原子能力表中;2)单张图内精确划分多格并在每格内保持主角一致性的能力超出现有工具的直接支持范围。需要调研:1)是否有 AI 工具支持直接生成多格漫画/故事板版式;2)ComfyUI 是否有图像拼接节点可将多张图合并为网格版式;3)是否需要结合设计工具完成最终版式合成"
  1255. },
  1256. {
  1257. "requirement_id": "REQ_064",
  1258. "requirement_text": "生成具有强烈氛围感的插画风场景图,整体画面以深蓝色调为主,室内外场景都笼罩在宁静的夜色中,窗户透出暖黄色灯光形成冷暖对比,画面质感接近油画或数字绘画风格,传达出静谧、沉思、略带忧郁的情绪氛围",
  1259. "source_subtree": {
  1260. "parent_node": "氛围基调",
  1261. "parent_id": 15890,
  1262. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/氛围基调"
  1263. },
  1264. "source_nodes": [
  1265. "柔和舒适",
  1266. "庄重宏大"
  1267. ],
  1268. "source_posts": [
  1269. "61bdc28b0000000001024896",
  1270. "676f8eac000000000902f53e",
  1271. "67fd299a000000001c00cf5d",
  1272. "681c64ce000000002200554c",
  1273. "6880a7a7000000000b02f5a6",
  1274. "68f568a1000000000301053d",
  1275. "69003bb30000000004015797",
  1276. "6960e87a000000000e00c216",
  1277. "6964beb3000000002103361a"
  1278. ],
  1279. "matched_capabilities": [
  1280. "CAP-001",
  1281. "CAP-004"
  1282. ],
  1283. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述深蓝色调、夜色氛围、冷暖对比光效等内容要素生成基础图像;CAP-004(风格切换与风格控制)通过加载油画/数字绘画风格LoRA或使用Midjourney --sref风格参考,将画面渲染为指定插画艺术风格,两者组合可完整实现该需求。",
  1284. "match_status": "完全满足",
  1285. "needs_research": false,
  1286. "research_note": ""
  1287. },
  1288. {
  1289. "requirement_id": "REQ_065",
  1290. "requirement_text": "制作色彩鲜艳、视觉冲击力强的宣传海报,背景使用渐变色块(蓝紫、橙红等高饱和度色彩),搭配几何抽象图形装饰,文字排版醒目大气,整体呈现出热烈、充满活力的欢庆氛围",
  1291. "source_subtree": {
  1292. "parent_node": "氛围基调",
  1293. "parent_id": 15890,
  1294. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/氛围基调"
  1295. },
  1296. "source_nodes": [
  1297. "欢庆热闹",
  1298. "庄重宏大"
  1299. ],
  1300. "source_posts": [
  1301. "61bdc28b0000000001024896",
  1302. "676f8eac000000000902f53e",
  1303. "67fd299a000000001c00cf5d",
  1304. "681c64ce000000002200554c",
  1305. "6880a7a7000000000b02f5a6",
  1306. "68f568a1000000000301053d",
  1307. "69003bb30000000004015797",
  1308. "6960e87a000000000e00c216",
  1309. "6964beb3000000002103361a"
  1310. ],
  1311. "matched_capabilities": [
  1312. "CAP-001",
  1313. "CAP-014"
  1314. ],
  1315. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述高饱和度渐变色块背景、几何抽象图形装饰、欢庆活力氛围等视觉要素生成海报底图;CAP-014(图像内文字渲染)利用Nano Banana Pro或Midjourney v8的文字渲染能力,在海报中嵌入醒目大气的排版文字,两者组合可完整实现该宣传海报需求。",
  1316. "match_status": "完全满足",
  1317. "needs_research": false,
  1318. "research_note": ""
  1319. },
  1320. {
  1321. "requirement_id": "REQ_066",
  1322. "requirement_text": "生成暖色调的室内空间效果图,以米白、浅棕、焦糖色为主色调,光线柔和自然,空间布置温馨舒适,整体画面传达出放松、治愈、生活化的温暖氛围",
  1323. "source_subtree": {
  1324. "parent_node": "氛围基调",
  1325. "parent_id": 15890,
  1326. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/氛围基调"
  1327. },
  1328. "source_nodes": [
  1329. "柔和舒适"
  1330. ],
  1331. "source_posts": [
  1332. "61bdc28b0000000001024896",
  1333. "676f8eac000000000902f53e",
  1334. "67fd299a000000001c00cf5d",
  1335. "681c64ce000000002200554c",
  1336. "6880a7a7000000000b02f5a6",
  1337. "68f568a1000000000301053d",
  1338. "69003bb30000000004015797",
  1339. "6960e87a000000000e00c216",
  1340. "6964beb3000000002103361a"
  1341. ],
  1342. "matched_capabilities": [
  1343. "CAP-001"
  1344. ],
  1345. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述米白/浅棕/焦糖色主色调、柔和自然光线、温馨舒适室内布置等要素,使用ComfyUI、Midjourney v8或Nano Banana Pro等工具直接生成室内空间效果图,完整实现该需求。",
  1346. "match_status": "完全满足",
  1347. "needs_research": false,
  1348. "research_note": ""
  1349. },
  1350. {
  1351. "requirement_id": "REQ_010",
  1352. "requirement_text": "制作多格宫格式信息图,将同类内容(如多种食材搭配方案)拆分为统一风格的小卡片,每格包含标题、食材图片和文字说明,整体排列整齐、色块鲜明,适合一图展示多个并列条目",
  1353. "source_subtree": {
  1354. "parent_node": "版面设计",
  1355. "parent_id": 15906,
  1356. "context_path": "/root/呈现/视觉/构图编排/版面设计"
  1357. },
  1358. "source_nodes": [
  1359. "辅助元素",
  1360. "文字动效"
  1361. ],
  1362. "source_posts": [
  1363. "67299a19000000001901483f",
  1364. "6732f52f000000001b013fdb",
  1365. "675c0669000000000600cfd7",
  1366. "6776b27d0000000013018545",
  1367. "678ce28d000000001603e3a8",
  1368. "69200dec000000001f00b884",
  1369. "692e7ccf000000001f00a137",
  1370. "694a6caf000000001f00e112"
  1371. ],
  1372. "matched_capabilities": [
  1373. "CAP-001",
  1374. "CAP-014"
  1375. ],
  1376. "capability_combination": "CAP-001 可生成统一风格的食材图片素材,CAP-014 可在图像中嵌入标题和文字说明;但两者组合仍无法直接实现多格宫格排版布局、色块分割、多卡片整齐排列等版式设计能力",
  1377. "match_status": "需要调研",
  1378. "needs_research": true,
  1379. "research_note": "现有能力中 CAP-001 可生成图像内容,CAP-014 可渲染图内文字,但缺少专门的多格宫格版式排版能力——即将多个卡片(含图片+标题+文字)按网格结构整齐排列、色块分明地组合为一张信息图的能力。需要调研:1)AI 图像生成工具是否支持通过提示词直接生成宫格信息图版式;2)是否有专门的信息图/排版生成工具(如 Canva AI、Adobe Firefly 等)支持此类结构化多格布局;3)Nano Banana Pro 或 FLUX.2 的复杂排版提示词能力是否能覆盖此场景。"
  1380. },
  1381. {
  1382. "requirement_id": "REQ_011",
  1383. "requirement_text": "在图片上叠加标注元素,如用红色圆点、箭头或emoji符号指向图中特定位置,配合说明文字,实现在真实照片上直观标记关键信息的视觉效果",
  1384. "source_subtree": {
  1385. "parent_node": "版面设计",
  1386. "parent_id": 15906,
  1387. "context_path": "/root/呈现/视觉/构图编排/版面设计"
  1388. },
  1389. "source_nodes": [
  1390. "辅助元素"
  1391. ],
  1392. "source_posts": [
  1393. "67299a19000000001901483f",
  1394. "6732f52f000000001b013fdb",
  1395. "675c0669000000000600cfd7",
  1396. "6776b27d0000000013018545",
  1397. "678ce28d000000001603e3a8",
  1398. "69200dec000000001f00b884",
  1399. "692e7ccf000000001f00a137",
  1400. "694a6caf000000001f00e112"
  1401. ],
  1402. "matched_capabilities": [
  1403. "CAP-012",
  1404. "CAP-014"
  1405. ],
  1406. "capability_combination": "CAP-012 可对图像局部区域进行重绘以叠加视觉元素,CAP-014 可在图像中渲染说明文字;但两者组合无法精准控制在指定坐标位置叠加箭头、圆点、emoji等标注符号",
  1407. "match_status": "需要调研",
  1408. "needs_research": true,
  1409. "research_note": "现有能力中 CAP-012 局部重绘可在图像特定区域添加内容,CAP-014 可渲染文字,但缺少精准坐标定位叠加标注元素的能力——即在图像指定像素位置精确放置红色圆点、箭头、emoji等标注符号并与说明文字配合的能力。AI 图像生成工具通常无法保证标注元素出现在精确指定的位置。需要调研:1)是否有 AI 工具支持通过坐标或区域描述精准叠加标注元素;2)Nano Banana Pro 或 FLUX.2 的图像编辑模式是否能通过提示词在指定位置添加箭头/圆点标注;3)是否需要结合非 AI 的图像编辑工具(如 Python PIL、Figma)来实现精准标注叠加。"
  1410. },
  1411. {
  1412. "requirement_id": "REQ_012",
  1413. "requirement_text": "制作图文混排的长图文内容,将大段文字与人物照片、数据表格、流程图等多种视觉元素组合排布在同一版面中,形成类似杂志或报告的专业排版风格",
  1414. "source_subtree": {
  1415. "parent_node": "版面设计",
  1416. "parent_id": 15906,
  1417. "context_path": "/root/呈现/视觉/构图编排/版面设计"
  1418. },
  1419. "source_nodes": [
  1420. "辅助元素",
  1421. "文字动效"
  1422. ],
  1423. "source_posts": [
  1424. "67299a19000000001901483f",
  1425. "6732f52f000000001b013fdb",
  1426. "675c0669000000000600cfd7",
  1427. "6776b27d0000000013018545",
  1428. "678ce28d000000001603e3a8",
  1429. "69200dec000000001f00b884",
  1430. "692e7ccf000000001f00a137",
  1431. "694a6caf000000001f00e112"
  1432. ],
  1433. "matched_capabilities": [
  1434. "CAP-001",
  1435. "CAP-014"
  1436. ],
  1437. "capability_combination": "CAP-001 可生成人物照片等图像素材,CAP-014 可在图像中渲染文字内容;但两者组合无法实现大段文字+多种视觉元素(表格、流程图、照片)在同一版面中的专业排版布局",
  1438. "match_status": "需要调研",
  1439. "needs_research": true,
  1440. "research_note": "现有能力中 CAP-001 可生成图像素材,CAP-014 可渲染图内文字,但缺少长图文专业排版能力——即将大段文字、人物照片、数据表格、流程图等异质元素按杂志/报告风格进行多栏布局、层次排版、精确对齐的能力。AI 图像生成工具不擅长处理结构化的长版面排版,尤其是数据表格和流程图的精确渲染。需要调研:1)是否有 AI 工具支持生成包含多种元素混排的长图文版面;2)Nano Banana Pro 的复杂排版布局能力(使用介绍 3.1 节提及支持复杂排版布局)是否能覆盖此场景;3)是否需要结合专业排版工具(如 Adobe InDesign AI 功能、Canva AI)来实现此类专业图文混排效果。"
  1441. },
  1442. {
  1443. "requirement_id": "REQ_013",
  1444. "requirement_text": "生成以暖黄/米棕色为背景底色的图文排版内容,整体画面呈现温暖、复古的暖色调氛围,适合健康养生、生活方式类主题",
  1445. "source_subtree": {
  1446. "parent_node": "色彩调性",
  1447. "parent_id": 15907,
  1448. "context_path": "/root/呈现/视觉/视觉气质/色彩调性"
  1449. },
  1450. "source_nodes": [
  1451. "背景底色",
  1452. "色调倾向"
  1453. ],
  1454. "source_posts": [
  1455. "66c5b638000000001d018e5a",
  1456. "6837f1270000000012006c8e",
  1457. "6874c80e000000000d027767",
  1458. "68b10b46000000001c00ca6c",
  1459. "69535514000000001e032b26",
  1460. "696078f70000000022038479",
  1461. "6964573a000000000d00800e",
  1462. "6969068e000000000d008b48"
  1463. ],
  1464. "matched_capabilities": [
  1465. "CAP-001"
  1466. ],
  1467. "capability_combination": "CAP-001(文本到图像生成)通过在提示词中详细描述暖黄/米棕色背景、温暖复古暖色调氛围及健康养生主题,可直接生成符合要求的图像。Midjourney v8、FLUX.2 [max]、Nano Banana Pro、Seedream 5.0 Lite 均支持通过提示词精确控制色调和氛围。若需图文排版中含有文字元素,可结合 CAP-014(图像内文字渲染)实现。",
  1468. "match_status": "完全满足",
  1469. "needs_research": false,
  1470. "research_note": ""
  1471. },
  1472. {
  1473. "requirement_id": "REQ_014",
  1474. "requirement_text": "生成以深色(黑色/深蓝/深紫)为背景底色的海报,搭配霓虹感彩色光效(橙、紫、青等),营造出科技感强烈的冷暖对比配色效果",
  1475. "source_subtree": {
  1476. "parent_node": "色彩调性",
  1477. "parent_id": 15907,
  1478. "context_path": "/root/呈现/视觉/视觉气质/色彩调性"
  1479. },
  1480. "source_nodes": [
  1481. "背景底色",
  1482. "配色组合",
  1483. "色调倾向"
  1484. ],
  1485. "source_posts": [
  1486. "66c5b638000000001d018e5a",
  1487. "6837f1270000000012006c8e",
  1488. "6874c80e000000000d027767",
  1489. "68b10b46000000001c00ca6c",
  1490. "69535514000000001e032b26",
  1491. "696078f70000000022038479",
  1492. "6964573a000000000d00800e",
  1493. "6969068e000000000d008b48"
  1494. ],
  1495. "matched_capabilities": [
  1496. "CAP-001",
  1497. "CAP-014"
  1498. ],
  1499. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述深色背景(黑色/深蓝/深紫)、霓虹光效(橙/紫/青)、科技感冷暖对比配色,可直接生成符合要求的海报图像;若海报含文字内容,结合 CAP-014(图像内文字渲染)在生成阶段嵌入清晰可读的文字元素。Midjourney v8 和 FLUX.2 [max] 对科技感霓虹风格的提示词遵循性强,效果尤为突出。",
  1500. "match_status": "完全满足",
  1501. "needs_research": false,
  1502. "research_note": ""
  1503. },
  1504. {
  1505. "requirement_id": "REQ_015",
  1506. "requirement_text": "生成整体色调偏粉紫、薄荷绿、浅蓝等低饱和度冷色系的插画或场景图,画面呈现出梦幻、静谧的冷色调氛围,颜色搭配柔和克制",
  1507. "source_subtree": {
  1508. "parent_node": "色彩调性",
  1509. "parent_id": 15907,
  1510. "context_path": "/root/呈现/视觉/视觉气质/色彩调性"
  1511. },
  1512. "source_nodes": [
  1513. "色调倾向",
  1514. "配色组合"
  1515. ],
  1516. "source_posts": [
  1517. "66c5b638000000001d018e5a",
  1518. "6837f1270000000012006c8e",
  1519. "6874c80e000000000d027767",
  1520. "68b10b46000000001c00ca6c",
  1521. "69535514000000001e032b26",
  1522. "696078f70000000022038479",
  1523. "6964573a000000000d00800e",
  1524. "6969068e000000000d008b48"
  1525. ],
  1526. "matched_capabilities": [
  1527. "CAP-001",
  1528. "CAP-004"
  1529. ],
  1530. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述粉紫、薄荷绿、浅蓝等低饱和度冷色系、梦幻静谧氛围,可直接生成符合要求的插画或场景图;CAP-004(风格切换与风格控制)可通过 --sref 风格参考图或 LoRA 模型进一步精确控制插画风格和色调倾向,确保低饱和度冷色系的柔和克制感稳定输出。两者结合可高度还原目标视觉效果。",
  1531. "match_status": "完全满足",
  1532. "needs_research": false,
  1533. "research_note": ""
  1534. },
  1535. {
  1536. "requirement_id": "REQ_016",
  1537. "requirement_text": "生成手部持握或展示物品的特写画面,手势自然,物品清晰呈现,如用手托举饺子、手持卡片、手握手机等,突出手与物品的互动关系",
  1538. "source_subtree": {
  1539. "parent_node": "动作姿态",
  1540. "parent_id": 15901,
  1541. "context_path": "/root/呈现/视觉/形象塑造/人物表现/动作姿态"
  1542. },
  1543. "source_nodes": [
  1544. "手部动作",
  1545. "创意动作"
  1546. ],
  1547. "source_posts": [
  1548. "6649dbe3000000000c018112",
  1549. "6687d458000000000a026f91",
  1550. "66daeddb000000002603ea42",
  1551. "682086dc0000000012003cbd",
  1552. "683d8695000000001200012a",
  1553. "68708544000000000d026732",
  1554. "68e9b94d0000000007036a6a",
  1555. "692c3402000000000d03b7b7"
  1556. ],
  1557. "matched_capabilities": [
  1558. "CAP-001",
  1559. "CAP-002"
  1560. ],
  1561. "capability_combination": "CAP-001 通过详细提示词描述手部姿态与物品互动关系生成基础图像;CAP-002 使用 OpenPose 骨架控制手部姿态精度,确保手势自然;Midjourney v8 在 CAP-001 实现中对手部解剖结构有明显改进,可优先选用",
  1562. "match_status": "需要调研",
  1563. "needs_research": true,
  1564. "research_note": "手部生成是 AI 图像生成的传统难点。CAP-001 可通过提示词描述手部动作,CAP-002 的 OpenPose 可提供骨架约束,但手部细节(手指数量、弯曲角度、与物品的接触关系)在现有能力中仍难以精确控制。Midjourney v8 虽声称改进了手部解剖结构,但尚无明确的手部特写专项能力说明。需要调研:1)是否有专门针对手部生成优化的 ControlNet 模型(如 HandRefiner);2)Midjourney v8 手部改进的实际效果是否满足特写级别的精度要求;3)是否需要结合 CAP-012 局部重绘对手部区域进行修复"
  1565. },
  1566. {
  1567. "requirement_id": "REQ_017",
  1568. "requirement_text": "生成多人或多只动物同框的协同姿态画面,如两只猫并排躺着穿睡衣、两人一起摆造型抱花束,呈现出同步、对称或互动的视觉效果",
  1569. "source_subtree": {
  1570. "parent_node": "动作姿态",
  1571. "parent_id": 15901,
  1572. "context_path": "/root/呈现/视觉/形象塑造/人物表现/动作姿态"
  1573. },
  1574. "source_nodes": [
  1575. "协同动作",
  1576. "行为概念"
  1577. ],
  1578. "source_posts": [
  1579. "6649dbe3000000000c018112",
  1580. "6687d458000000000a026f91",
  1581. "66daeddb000000002603ea42",
  1582. "682086dc0000000012003cbd",
  1583. "683d8695000000001200012a",
  1584. "68708544000000000d026732",
  1585. "68e9b94d0000000007036a6a",
  1586. "692c3402000000000d03b7b7"
  1587. ],
  1588. "matched_capabilities": [
  1589. "CAP-001",
  1590. "CAP-002",
  1591. "CAP-020"
  1592. ],
  1593. "capability_combination": "CAP-020 支持多主体合成到同一场景;CAP-002 使用 OpenPose 骨架同时控制多个主体的姿态,实现同步/对称/互动的协同姿态;CAP-001 通过提示词描述协同动作语义;三者组合:先用 CAP-002 定义多主体骨架姿态,再用 CAP-001 生成内容,CAP-020 确保多主体外观一致性",
  1594. "match_status": "需要调研",
  1595. "needs_research": true,
  1596. "research_note": "现有能力可部分支持:CAP-001 可通过提示词描述多主体协同场景,CAP-020 可合成多主体,CAP-002 可控制姿态骨架。但核心挑战在于:1)多主体同框时各自姿态的精确协同控制(如两只猫完全对称并排)在 OpenPose 多人骨架控制中存在主体混淆风险;2)动物(猫)的姿态骨架控制与人体 OpenPose 不同,需要调研是否有动物姿态 ControlNet 模型;3)多主体协同的对称/同步视觉效果是否能通过现有工具稳定复现,需要调研实际效果"
  1597. },
  1598. {
  1599. "requirement_id": "REQ_018",
  1600. "requirement_text": "生成创意性的嘴部动作特写,如用嘴唇衔住花朵茎部形成'嘴唇花'的视觉效果,将身体部位与物品结合产生趣味创意画面",
  1601. "source_subtree": {
  1602. "parent_node": "动作姿态",
  1603. "parent_id": 15901,
  1604. "context_path": "/root/呈现/视觉/形象塑造/人物表现/动作姿态"
  1605. },
  1606. "source_nodes": [
  1607. "创意动作",
  1608. "手部动作"
  1609. ],
  1610. "source_posts": [
  1611. "6649dbe3000000000c018112",
  1612. "6687d458000000000a026f91",
  1613. "66daeddb000000002603ea42",
  1614. "682086dc0000000012003cbd",
  1615. "683d8695000000001200012a",
  1616. "68708544000000000d026732",
  1617. "68e9b94d0000000007036a6a",
  1618. "692c3402000000000d03b7b7"
  1619. ],
  1620. "matched_capabilities": [
  1621. "CAP-001"
  1622. ],
  1623. "capability_combination": "CAP-001 通过详细提示词描述嘴部与物品的创意互动关系生成图像;可结合 Midjourney v8 或 FLUX.2 [max] 的照片级真实感能力生成特写画面",
  1624. "match_status": "需要调研",
  1625. "needs_research": true,
  1626. "research_note": "现有 CAP-001 可通过提示词尝试生成此类创意特写,但存在以下不确定性:1)嘴部特写中嘴唇与细长物体(花茎)的精确接触关系难以通过提示词精确控制,AI 模型容易生成解剖不自然的结果;2)CAP-002 的 OpenPose 主要针对全身/上半身骨架,对嘴部局部动作的精细控制能力不明确;3)此类创意合成画面(身体部位与物品融合产生视觉双关效果)对模型的创意理解和精确执行能力要求较高。需要调研:1)是否有面部/嘴部局部 ControlNet 控制方案;2)FLUX.2 [max] 或 Midjourney v8 对此类创意提示词的实际执行效果;3)是否需要结合 CAP-012 局部重绘对嘴部区域进行精细调整"
  1627. },
  1628. {
  1629. "requirement_id": "REQ_052",
  1630. "requirement_text": "将多张图片按网格或分区方式拼贴成一张图,每个区域展示不同角度或不同场景,整体画面有清晰的分割感和节奏感",
  1631. "source_subtree": {
  1632. "parent_node": "元素编排",
  1633. "parent_id": 15883,
  1634. "context_path": "/root/呈现/视觉/构图编排/空间布局/元素编排"
  1635. },
  1636. "source_nodes": [
  1637. "排列节奏",
  1638. "组合关系",
  1639. "布局规划"
  1640. ],
  1641. "source_posts": [
  1642. "61bdc28b0000000001024896",
  1643. "65eea166000000000d00c6d8",
  1644. "65f4359b00000000140079b5",
  1645. "6732cd8a000000001b02f948",
  1646. "6746fb5600000000070260ce",
  1647. "68737e97000000000d027b81",
  1648. "693f94d80000000019025898",
  1649. "696f2f97000000000e00e33c"
  1650. ],
  1651. "matched_capabilities": [],
  1652. "capability_combination": "",
  1653. "match_status": "需要调研",
  1654. "needs_research": true,
  1655. "research_note": "现有能力表中没有直接支持多图网格拼贴/分区排版的能力。CAP-001文本到图像生成理论上可以通过提示词描述网格布局来生成类似效果,但无法精确控制每个区域放置指定的已有图片内容。CAP-008批量图像生成只能批量产出独立图像,不能将多张图合并为网格布局。需要调研:1)是否有AI工具支持将多张已有图片自动排列为网格/分区拼贴图的能力;2)ComfyUI是否有图像拼接/网格合成节点;3)是否可通过提示词精确控制多分区画面布局并在每个分区生成不同内容。"
  1656. },
  1657. {
  1658. "requirement_id": "REQ_053",
  1659. "requirement_text": "在同一画面中合理安排主体与背景的空间关系,让主体(人物、动物、物品)在画面中有明确的视觉焦点,背景简洁或有层次地衬托主体",
  1660. "source_subtree": {
  1661. "parent_node": "元素编排",
  1662. "parent_id": 15883,
  1663. "context_path": "/root/呈现/视觉/构图编排/空间布局/元素编排"
  1664. },
  1665. "source_nodes": [
  1666. "视线焦点",
  1667. "疏密比例",
  1668. "空间拓展"
  1669. ],
  1670. "source_posts": [
  1671. "61bdc28b0000000001024896",
  1672. "65eea166000000000d00c6d8",
  1673. "65f4359b00000000140079b5",
  1674. "6732cd8a000000001b02f948",
  1675. "6746fb5600000000070260ce",
  1676. "68737e97000000000d027b81",
  1677. "693f94d80000000019025898",
  1678. "696f2f97000000000e00e33c"
  1679. ],
  1680. "matched_capabilities": [
  1681. "CAP-001",
  1682. "CAP-002",
  1683. "CAP-003"
  1684. ],
  1685. "capability_combination": "CAP-001通过提示词描述主体与背景的构图关系(如主体居中/前景突出/背景虚化等)来控制视觉焦点;CAP-002通过ControlNet结构控制确保主体在画面中的位置和姿态符合预期构图;CAP-003在需要保持特定主体外观的场景下,确保主体特征一致的同时配合背景生成,三者组合可实现主体突出、背景衬托的构图效果。",
  1686. "match_status": "完全满足",
  1687. "needs_research": false,
  1688. "research_note": ""
  1689. },
  1690. {
  1691. "requirement_id": "REQ_054",
  1692. "requirement_text": "生成包含多个独立小格子的图文排版画面,每个格子内有图片和文字说明,格子之间疏密有致、整齐排列,整体呈现信息图表或内容合集的视觉效果",
  1693. "source_subtree": {
  1694. "parent_node": "元素编排",
  1695. "parent_id": 15883,
  1696. "context_path": "/root/呈现/视觉/构图编排/空间布局/元素编排"
  1697. },
  1698. "source_nodes": [
  1699. "布局规划",
  1700. "疏密比例",
  1701. "排列节奏"
  1702. ],
  1703. "source_posts": [
  1704. "61bdc28b0000000001024896",
  1705. "65eea166000000000d00c6d8",
  1706. "65f4359b00000000140079b5",
  1707. "6732cd8a000000001b02f948",
  1708. "6746fb5600000000070260ce",
  1709. "68737e97000000000d027b81",
  1710. "693f94d80000000019025898",
  1711. "696f2f97000000000e00e33c"
  1712. ],
  1713. "matched_capabilities": [
  1714. "CAP-001",
  1715. "CAP-014"
  1716. ],
  1717. "capability_combination": "CAP-001可通过提示词描述信息图表/内容合集的整体视觉风格来生成类似布局;CAP-014支持在图像中渲染清晰可读的文字内容,可在格子内嵌入文字说明。但两者组合仍难以精确控制每个格子的独立内容(图片+文字的精确对应关系)。",
  1718. "match_status": "需要调研",
  1719. "needs_research": true,
  1720. "research_note": "现有能力中CAP-001+CAP-014可以生成整体上具有图文排版感的画面,CAP-014支持文字渲染。但核心缺口在于:无法精确控制多个独立格子中每个格子的图片内容与文字说明的精确对应关系,也无法保证格子数量、间距、疏密的精确排版控制。需要调研:1)AI图像生成工具是否支持结构化多格子图文排版的精确布局控制;2)是否有专门的信息图表/卡片合集生成能力;3)ComfyUI是否有支持图文混排网格布局的节点方案。"
  1721. },
  1722. {
  1723. "requirement_id": "REQ_088",
  1724. "requirement_text": "生成超现实浪漫场景图:将人物置于不可能存在的宏大环境中,如站在地球边缘俯瞰星空、坐在云端长椅上漂浮、在星海上骑行,画面充满梦幻感和史诗级视觉冲击力",
  1725. "source_subtree": {
  1726. "parent_node": "审美取向",
  1727. "parent_id": 15903,
  1728. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/审美取向"
  1729. },
  1730. "source_nodes": [
  1731. "幻想虚构",
  1732. "创意表现"
  1733. ],
  1734. "source_posts": [
  1735. "648d8edf0000000011013447",
  1736. "6727171b000000001b01114b",
  1737. "681c64ce000000002200554c",
  1738. "689b158f000000001b03e512",
  1739. "68e6ecb90000000003021e34",
  1740. "69535514000000001e032b26",
  1741. "6965d491000000000e00f9b0",
  1742. "696b5332000000002103c497"
  1743. ],
  1744. "matched_capabilities": [
  1745. "CAP-001",
  1746. "CAP-004"
  1747. ],
  1748. "capability_combination": "CAP-001(文本到图像生成)是核心能力,通过详细的提示词描述超现实场景(地球边缘、云端、星海等)直接生成图像,FLUX.2 [max]、Midjourney v8 或 Nano Banana Pro 均可胜任此类幻想场景生成;CAP-004(风格切换与风格控制)可通过 --sref 或 LoRA 进一步强化梦幻/史诗视觉风格,确保画面氛围符合预期。",
  1749. "match_status": "完全满足",
  1750. "needs_research": false,
  1751. "research_note": ""
  1752. },
  1753. {
  1754. "requirement_id": "REQ_089",
  1755. "requirement_text": "制作科技感强烈的活动宣传海报:使用深色背景配合橙色、蓝色等高对比度霓虹色调,融合未来感城市或科技场景插图,搭配大号粗体标题文字,整体呈现出硬核、前沿的视觉气质",
  1756. "source_subtree": {
  1757. "parent_node": "审美取向",
  1758. "parent_id": 15903,
  1759. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/审美取向"
  1760. },
  1761. "source_nodes": [
  1762. "概念气质",
  1763. "创意表现",
  1764. "风格融合"
  1765. ],
  1766. "source_posts": [
  1767. "648d8edf0000000011013447",
  1768. "6727171b000000001b01114b",
  1769. "681c64ce000000002200554c",
  1770. "689b158f000000001b03e512",
  1771. "68e6ecb90000000003021e34",
  1772. "69535514000000001e032b26",
  1773. "6965d491000000000e00f9b0",
  1774. "696b5332000000002103c497"
  1775. ],
  1776. "matched_capabilities": [
  1777. "CAP-001",
  1778. "CAP-004",
  1779. "CAP-014"
  1780. ],
  1781. "capability_combination": "CAP-001(文本到图像生成)生成深色背景+霓虹色调+未来感城市场景的海报底图;CAP-004(风格切换与风格控制)通过风格参考图或 LoRA 强化赛博朋克/科技感视觉风格;CAP-014(图像内文字渲染)在海报中嵌入大号粗体标题文字,Nano Banana Pro 文本准确率最高(94-96%),Midjourney v8 也有改进的文本渲染能力,三者组合可完整实现该海报需求。",
  1782. "match_status": "完全满足",
  1783. "needs_research": false,
  1784. "research_note": ""
  1785. },
  1786. {
  1787. "requirement_id": "REQ_090",
  1788. "requirement_text": "生成融合东方传统与现代简约的室内空间效果图:以米白、暖棕为主色调,加入拱形门洞、藤编元素、中式花卉装饰画等传统细节,整体呈现温润雅致的新中式生活美学氛围",
  1789. "source_subtree": {
  1790. "parent_node": "审美取向",
  1791. "parent_id": 15903,
  1792. "context_path": "/root/呈现/视觉/视觉气质/视觉风格/艺术风格/审美取向"
  1793. },
  1794. "source_nodes": [
  1795. "民俗传统",
  1796. "风格融合",
  1797. "概念气质"
  1798. ],
  1799. "source_posts": [
  1800. "648d8edf0000000011013447",
  1801. "6727171b000000001b01114b",
  1802. "681c64ce000000002200554c",
  1803. "689b158f000000001b03e512",
  1804. "68e6ecb90000000003021e34",
  1805. "69535514000000001e032b26",
  1806. "6965d491000000000e00f9b0",
  1807. "696b5332000000002103c497"
  1808. ],
  1809. "matched_capabilities": [
  1810. "CAP-001",
  1811. "CAP-004"
  1812. ],
  1813. "capability_combination": "CAP-001(文本到图像生成)是核心能力,通过详细提示词描述室内空间构成要素(米白暖棕色调、拱形门洞、藤编元素、中式花卉装饰画等)直接生成效果图,ComfyUI 案例5「建筑效果图快速出图」和 FLUX.2 [max] 均支持室内设计效果图生成;CAP-004(风格切换与风格控制)通过新中式风格 LoRA 或风格参考图精准控制东方传统与现代简约融合的视觉风格,确保氛围准确。",
  1814. "match_status": "完全满足",
  1815. "needs_research": false,
  1816. "research_note": ""
  1817. },
  1818. {
  1819. "requirement_id": "REQ_034",
  1820. "requirement_text": "生成真实户外场景中的人物活动照片,画面要呈现自然光线下的街道、公园、游乐场等具体地点环境,人物动作自然生动,背景环境细节丰富真实",
  1821. "source_subtree": {
  1822. "parent_node": "场景人物",
  1823. "parent_id": 15891,
  1824. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/场景人物"
  1825. },
  1826. "source_nodes": [
  1827. "场景取景",
  1828. "环境取景"
  1829. ],
  1830. "source_posts": [
  1831. "66f51b90000000002a036660",
  1832. "6732cd8a000000001b02f948",
  1833. "677b5460000000000b00d33e",
  1834. "68a4107f000000001c00e8e9",
  1835. "68abe632000000001c0348c0",
  1836. "6913cafd000000000703402b",
  1837. "69647323000000001a01ef60"
  1838. ],
  1839. "matched_capabilities": [
  1840. "CAP-001",
  1841. "CAP-002",
  1842. "CAP-006"
  1843. ],
  1844. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述户外场景、自然光线、具体地点和人物动作,利用 FLUX.2 [max] 或 Midjourney v8 的照片级真实感能力生成基础图像;CAP-002(结构/姿态控制生成)通过 ControlNet + OpenPose 控制人物动作姿态使其自然生动;CAP-006(图像细节增强与高清放大)对背景环境细节进行增强,使场景细节更丰富真实。",
  1845. "match_status": "完全满足",
  1846. "needs_research": false,
  1847. "research_note": ""
  1848. },
  1849. {
  1850. "requirement_id": "REQ_035",
  1851. "requirement_text": "生成多人聚集的活动现场图,如会议、展览、户外聚会等场景,画面中需要呈现多个人物同框、有组织的群体互动氛围,背景有明显的活动标识或场地特征",
  1852. "source_subtree": {
  1853. "parent_node": "场景人物",
  1854. "parent_id": 15891,
  1855. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/场景人物"
  1856. },
  1857. "source_nodes": [
  1858. "群像合影",
  1859. "集体演出"
  1860. ],
  1861. "source_posts": [
  1862. "66f51b90000000002a036660",
  1863. "6732cd8a000000001b02f948",
  1864. "677b5460000000000b00d33e",
  1865. "68a4107f000000001c00e8e9",
  1866. "68abe632000000001c0348c0",
  1867. "6913cafd000000000703402b",
  1868. "69647323000000001a01ef60"
  1869. ],
  1870. "matched_capabilities": [
  1871. "CAP-001",
  1872. "CAP-020",
  1873. "CAP-014"
  1874. ],
  1875. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述多人聚集场景、活动类型和群体互动氛围生成基础图像;CAP-020(多主体场景合成)在需要特定人物出现时,将多个人物参考图合成到同一活动场景中,保持各人物外观一致;CAP-014(图像内文字渲染)在背景中渲染活动标识、横幅、标牌等文字元素,强化活动场地特征。",
  1876. "match_status": "完全满足",
  1877. "needs_research": false,
  1878. "research_note": ""
  1879. },
  1880. {
  1881. "requirement_id": "REQ_036",
  1882. "requirement_text": "生成真实物品的特写或陈列展示图,物品摆放清晰、细节可辨,适合用于产品展示或场景道具呈现,画面构图干净突出主体",
  1883. "source_subtree": {
  1884. "parent_node": "场景人物",
  1885. "parent_id": 15891,
  1886. "context_path": "/root/呈现/视觉/影像制作/实景拍摄/场景人物"
  1887. },
  1888. "source_nodes": [
  1889. "实物呈现"
  1890. ],
  1891. "source_posts": [
  1892. "66f51b90000000002a036660",
  1893. "6732cd8a000000001b02f948",
  1894. "677b5460000000000b00d33e",
  1895. "68a4107f000000001c00e8e9",
  1896. "68abe632000000001c0348c0",
  1897. "6913cafd000000000703402b",
  1898. "69647323000000001a01ef60"
  1899. ],
  1900. "matched_capabilities": [
  1901. "CAP-001",
  1902. "CAP-003",
  1903. "CAP-006",
  1904. "CAP-016"
  1905. ],
  1906. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述物品特写、陈列方式、干净构图和产品展示风格生成基础图像,利用 Nano Banana Pro 或 FLUX.2 [max] 的照片级真实感能力;CAP-003(图像主体一致性保持)在有参考物品图时,确保生成图中物品外观与参考图一致;CAP-016(生成阶段原生高分辨率输出)直接输出高分辨率图像使物品细节清晰可辨;CAP-006(图像细节增强与高清放大)对物品纹理、材质等细节进行后期增强。",
  1907. "match_status": "完全满足",
  1908. "needs_research": false,
  1909. "research_note": ""
  1910. },
  1911. {
  1912. "requirement_id": "REQ_004",
  1913. "requirement_text": "生成带有特定道具装扮的人物场景图,道具需与人物自然融合,例如猫咪戴假发穿衣服手持书本、人物手持购物篮抱着玩偶玩具等,道具细节清晰可辨",
  1914. "source_subtree": {
  1915. "parent_node": "符号元素",
  1916. "parent_id": 15913,
  1917. "context_path": "/root/呈现/视觉/形象塑造/符号元素"
  1918. },
  1919. "source_nodes": [
  1920. "道具布景"
  1921. ],
  1922. "source_posts": [
  1923. "65febd8e0000000012035538",
  1924. "67e37ff8000000001c008b5e",
  1925. "682a8f11000000002002a511",
  1926. "6882f593000000001100272d",
  1927. "69535514000000001e032b26",
  1928. "6960e87a000000000e00c216"
  1929. ],
  1930. "matched_capabilities": [
  1931. "CAP-001",
  1932. "CAP-003"
  1933. ],
  1934. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述人物与道具的组合场景(如猫咪戴假发穿衣服手持书本),直接生成包含道具的人物场景图;CAP-003(图像主体一致性保持)可在需要保持特定角色/动物外观一致的情况下,以参考图为输入确保主体特征稳定,同时通过提示词控制道具细节的清晰呈现。两者结合可初步覆盖道具与人物融合的需求,但手持、穿戴等接触关系的自然度及道具细节的可辨性仍需调研验证。",
  1935. "match_status": "需要调研",
  1936. "needs_research": true,
  1937. "research_note": "现有 CAP-001 可通过提示词生成人物+道具场景,CAP-003 可保持主体一致性,但对于道具与人物的精确空间融合(如手持、穿戴等接触关系的自然度)以及道具细节的精确可辨性,现有能力描述中未明确说明能稳定实现复杂道具交互(如猫咪手持书本、人物抱玩偶等非常规姿态下的道具融合)。需要调研:1)各文生图工具对复杂道具交互场景的实际生成质量;2)是否需要结合 CAP-002(姿态控制)来精确控制持握姿态;3)道具细节清晰度在不同工具下的表现差异。"
  1938. },
  1939. {
  1940. "requirement_id": "REQ_005",
  1941. "requirement_text": "生成婚礼或节日庆典场景,背景需包含大量花卉装饰、定制发光字牌、喜字等布景元素,整体氛围感强烈,道具与场景协调统一",
  1942. "source_subtree": {
  1943. "parent_node": "符号元素",
  1944. "parent_id": 15913,
  1945. "context_path": "/root/呈现/视觉/形象塑造/符号元素"
  1946. },
  1947. "source_nodes": [
  1948. "道具布景"
  1949. ],
  1950. "source_posts": [
  1951. "65febd8e0000000012035538",
  1952. "67e37ff8000000001c008b5e",
  1953. "682a8f11000000002002a511",
  1954. "6882f593000000001100272d",
  1955. "69535514000000001e032b26",
  1956. "6960e87a000000000e00c216"
  1957. ],
  1958. "matched_capabilities": [
  1959. "CAP-001",
  1960. "CAP-014"
  1961. ],
  1962. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述婚礼/庆典场景的整体氛围、花卉装饰、布景元素等,生成氛围感强烈的场景图;CAP-014(图像内文字渲染)负责在场景中准确渲染发光字牌上的定制文字、喜字等文字元素,确保文字清晰可读且与场景风格融合。两者结合可初步覆盖场景氛围生成与文字元素渲染的需求,但密集花卉装饰的细节质量和发光字牌的发光效果仍需调研验证。",
  1963. "match_status": "需要调研",
  1964. "needs_research": true,
  1965. "research_note": "现有 CAP-001 可生成婚礼庆典整体场景,CAP-014 可渲染文字元素,但存在以下不确定性:1)大量花卉装饰的密集布景细节在 AI 生成中容易出现混乱或失真,现有能力未明确说明对复杂密集装饰场景的生成质量;2)定制发光字牌需要同时实现文字准确渲染+发光效果+与场景光照协调,CAP-014 侧重文字准确性,发光效果的物理自洽性未有明确说明;3)喜字等中文特殊字符的渲染准确性需确认(Nano Banana Pro 支持中文,但其他工具需验证)。需要调研:各工具对密集装饰场景和发光文字效果的实际生成能力。"
  1966. },
  1967. {
  1968. "requirement_id": "REQ_006",
  1969. "requirement_text": "生成精致室内空间场景,画面中需呈现陶瓷器皿、绿植、家具等道具摆件,光线自然柔和,营造出温馨生活感或高颜值家居氛围",
  1970. "source_subtree": {
  1971. "parent_node": "符号元素",
  1972. "parent_id": 15913,
  1973. "context_path": "/root/呈现/视觉/形象塑造/符号元素"
  1974. },
  1975. "source_nodes": [
  1976. "道具布景"
  1977. ],
  1978. "source_posts": [
  1979. "65febd8e0000000012035538",
  1980. "67e37ff8000000001c008b5e",
  1981. "682a8f11000000002002a511",
  1982. "6882f593000000001100272d",
  1983. "69535514000000001e032b26",
  1984. "6960e87a000000000e00c216"
  1985. ],
  1986. "matched_capabilities": [
  1987. "CAP-001",
  1988. "CAP-016"
  1989. ],
  1990. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述室内场景构成(陶瓷器皿、绿植、家具摆件)、光线质感(自然柔和)和整体氛围(温馨/高颜值家居),直接生成目标场景图;CAP-016(生成阶段原生高分辨率输出)确保陶瓷纹理、植物叶片、家具材质等道具细节在原生输出阶段即清晰呈现,无需后期放大处理,提升精致感。",
  1991. "match_status": "完全满足",
  1992. "needs_research": false,
  1993. "research_note": ""
  1994. },
  1995. {
  1996. "requirement_id": "REQ_043",
  1997. "requirement_text": "在图片上叠加标题文字,文字大小、粗细、颜色各异,形成层次感强的排版效果——例如大标题用粗体醒目字体,副标题用细体小字,整体风格统一(如深色系商务风或简约设计风)",
  1998. "source_subtree": {
  1999. "parent_node": "字体标题",
  2000. "parent_id": 15899,
  2001. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题"
  2002. },
  2003. "source_nodes": [
  2004. "基础文字",
  2005. "字体装饰"
  2006. ],
  2007. "source_posts": [
  2008. "65eea166000000000d00c6d8",
  2009. "65f4359b00000000140079b5",
  2010. "66619827000000000600486f",
  2011. "68f988f2000000000703ada5",
  2012. "693d0b1d000000001e02ba36",
  2013. "6960924b000000001a037a1c"
  2014. ],
  2015. "matched_capabilities": [
  2016. "CAP-014"
  2017. ],
  2018. "capability_combination": "CAP-014 支持在生成图像中嵌入文字内容,Nano Banana Pro 支持复杂排版布局和多语言高保真文本渲染,可在生成阶段直接输出含层次化排版文字的图像",
  2019. "match_status": "需要调研",
  2020. "needs_research": true,
  2021. "research_note": "CAP-014 支持在生成图像中渲染文字,但其核心场景是将文字作为图像内容的一部分自然融合(如产品标签、Logo),而本需求是在已有图片上叠加多层次排版文字(大标题粗体+副标题细体,颜色各异,形成设计感排版)。现有能力缺少:1)对已有图片进行后期文字叠加合成的能力;2)精确控制字体粗细、大小、颜色等排版参数的能力;3)多层次文字排版布局的精确控制。需要调研是否有专门的图文排版合成工具(如 Canva API、Adobe Express、或 ComfyUI 中的文字叠加节点)能够在已有图片上精确叠加多层次排版文字。"
  2022. },
  2023. {
  2024. "requirement_id": "REQ_044",
  2025. "requirement_text": "在AI生成的卡通角色图片上叠加幽默吐槽文案,文字直接覆盖在图片上方,字体简洁白色,与画面情绪呼应,形成图文结合的表情包风格内容",
  2026. "source_subtree": {
  2027. "parent_node": "字体标题",
  2028. "parent_id": 15899,
  2029. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题"
  2030. },
  2031. "source_nodes": [
  2032. "基础文字",
  2033. "字体装饰"
  2034. ],
  2035. "source_posts": [
  2036. "65eea166000000000d00c6d8",
  2037. "65f4359b00000000140079b5",
  2038. "66619827000000000600486f",
  2039. "68f988f2000000000703ada5",
  2040. "693d0b1d000000001e02ba36",
  2041. "6960924b000000001a037a1c"
  2042. ],
  2043. "matched_capabilities": [
  2044. "CAP-001",
  2045. "CAP-014"
  2046. ],
  2047. "capability_combination": "CAP-001 可生成卡通角色图片,CAP-014 支持在图像中渲染文字内容",
  2048. "match_status": "需要调研",
  2049. "needs_research": true,
  2050. "research_note": "CAP-001 可生成卡通角色图片,CAP-014 可在生成阶段嵌入文字,但本需求的核心是在已有AI生成图片上叠加文字(表情包制作流程),需要精确控制文字位置(如图片顶部/底部)、字体样式(简洁白色)、文字与图片的层叠关系。现有能力缺少:1)对已有图片进行文字后期叠加合成的专项能力;2)精确控制文字在图片特定位置覆盖的能力;3)表情包标准排版格式(如顶部+底部文字)的支持。需要调研支持图片+文字合成的工具,如 ComfyUI 中是否有文字叠加节点、或专门的表情包生成工具。"
  2051. },
  2052. {
  2053. "requirement_id": "REQ_045",
  2054. "requirement_text": "制作多宫格拼图帖子,每格图片配有对应的标题文字或字幕说明,文字风格统一,整体排列整齐,适合用于周记、日历、流程说明等系列内容展示",
  2055. "source_subtree": {
  2056. "parent_node": "字体标题",
  2057. "parent_id": 15899,
  2058. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题"
  2059. },
  2060. "source_nodes": [
  2061. "基础文字",
  2062. "字体装饰"
  2063. ],
  2064. "source_posts": [
  2065. "65eea166000000000d00c6d8",
  2066. "65f4359b00000000140079b5",
  2067. "66619827000000000600486f",
  2068. "68f988f2000000000703ada5",
  2069. "693d0b1d000000001e02ba36",
  2070. "6960924b000000001a037a1c"
  2071. ],
  2072. "matched_capabilities": [
  2073. "CAP-001",
  2074. "CAP-008",
  2075. "CAP-014"
  2076. ],
  2077. "capability_combination": "CAP-001 生成各格图片内容,CAP-008 批量生成多张图片,CAP-014 在每张图片中渲染对应文字说明",
  2078. "match_status": "需要调研",
  2079. "needs_research": true,
  2080. "research_note": "现有能力可以批量生成多张图片并在图像中渲染文字,但本需求的核心是将多张图片+文字组合成多宫格排版布局(整体排列整齐、统一风格的拼图帖子)。现有能力缺少:1)多图拼接/网格布局合成能力(将多张图片按宫格排列组合为一张完整图片);2)跨多格统一文字排版风格的控制;3)整体版面设计和对齐的能力。需要调研支持多图网格拼接合成的工具,如 ComfyUI 中的图像拼接节点、或专门的排版合成工具(Canva、图文排版API等)是否能实现多宫格布局合成。"
  2081. },
  2082. {
  2083. "requirement_id": "REQ_072",
  2084. "requirement_text": "给同一张猫咪照片批量添加不同职业的帽子、道具和配件(如厨师帽、安全帽、眼镜、画板等),让猫咪看起来像在扮演各种职业角色",
  2085. "source_subtree": {
  2086. "parent_node": "图像合成",
  2087. "parent_id": 15898,
  2088. "context_path": "/root/呈现/视觉/影像制作/后期处理/图像合成/图像合成"
  2089. },
  2090. "source_nodes": [
  2091. "抠图处理",
  2092. "拼贴融合",
  2093. "图层叠加"
  2094. ],
  2095. "source_posts": [
  2096. "66c5b638000000001d018e5a",
  2097. "66daeddb000000002603ea42",
  2098. "677b5460000000000b00d33e",
  2099. "6874c80e000000000d027767",
  2100. "691d3112000000001e036559",
  2101. "6964be3900000000210282a4"
  2102. ],
  2103. "matched_capabilities": [
  2104. "CAP-003",
  2105. "CAP-008",
  2106. "CAP-012"
  2107. ],
  2108. "capability_combination": "CAP-003(图像主体一致性保持)确保猫咪外观在所有版本中保持一致;CAP-012(图像局部重绘)在猫咪头部/手部区域局部重绘添加不同职业道具;CAP-008(批量图像生成)批量循环生成多个职业版本,每次切换不同道具提示词自动输出",
  2109. "match_status": "需要调研",
  2110. "needs_research": true,
  2111. "research_note": "现有能力可实现主体一致性保持(CAP-003)和局部重绘(CAP-012),但核心缺口在于:将外部素材(帽子、道具等配件图片)精准叠加/融合到猫咪照片特定位置的能力——即传统意义上的'抠图+拼贴融合'。原子能力表中没有明确的'前景素材抠图与精准位置合成'能力。需要调研:1)AI工具是否支持将用户提供的配件素材图抠图后精准合成到指定主体位置;2)ComfyUI是否有专用的图像合成/蒙版叠加节点可实现此类配件叠加;3)是否可通过局部重绘(CAP-012)结合参考图完全替代传统抠图拼贴流程"
  2112. },
  2113. {
  2114. "requirement_id": "REQ_073",
  2115. "requirement_text": "将真实照片转换成具有统一色调风格的插画效果,整体呈现蓝紫色调的复古油画或动画风格,让风景场景看起来像艺术插图",
  2116. "source_subtree": {
  2117. "parent_node": "图像合成",
  2118. "parent_id": 15898,
  2119. "context_path": "/root/呈现/视觉/影像制作/后期处理/图像合成/图像合成"
  2120. },
  2121. "source_nodes": [
  2122. "风格化处理",
  2123. "AI生成合成"
  2124. ],
  2125. "source_posts": [
  2126. "66c5b638000000001d018e5a",
  2127. "66daeddb000000002603ea42",
  2128. "677b5460000000000b00d33e",
  2129. "6874c80e000000000d027767",
  2130. "691d3112000000001e036559",
  2131. "6964be3900000000210282a4"
  2132. ],
  2133. "matched_capabilities": [
  2134. "CAP-004",
  2135. "CAP-012"
  2136. ],
  2137. "capability_combination": "CAP-004(风格切换与风格控制)是核心能力:通过加载油画/动画风格LoRA(ComfyUI)或使用--sref上传蓝紫色调复古风格参考图(Midjourney v8),将输入的真实风景照片渲染为目标艺术风格;CAP-012可辅助对特定区域进行风格化局部调整以确保色调统一",
  2138. "match_status": "完全满足",
  2139. "needs_research": false,
  2140. "research_note": ""
  2141. },
  2142. {
  2143. "requirement_id": "REQ_074",
  2144. "requirement_text": "制作图文排版信息图,将多张食材产品图片抠出后整齐排列在统一背景上,配合文字说明组合成内容丰富的科普海报",
  2145. "source_subtree": {
  2146. "parent_node": "图像合成",
  2147. "parent_id": 15898,
  2148. "context_path": "/root/呈现/视觉/影像制作/后期处理/图像合成/图像合成"
  2149. },
  2150. "source_nodes": [
  2151. "抠图处理",
  2152. "拼贴融合",
  2153. "图层叠加"
  2154. ],
  2155. "source_posts": [
  2156. "66c5b638000000001d018e5a",
  2157. "66daeddb000000002603ea42",
  2158. "677b5460000000000b00d33e",
  2159. "6874c80e000000000d027767",
  2160. "691d3112000000001e036559",
  2161. "6964be3900000000210282a4"
  2162. ],
  2163. "matched_capabilities": [
  2164. "CAP-014",
  2165. "CAP-001"
  2166. ],
  2167. "capability_combination": "CAP-014(图像内文字渲染)支持在生成图像中嵌入清晰可读的文字说明;CAP-001(文本到图像生成)可生成带有整体排版布局的科普海报底图",
  2168. "match_status": "需要调研",
  2169. "needs_research": true,
  2170. "research_note": "需求的核心流程是:将多张已有食材产品图片抠图去背景→整齐排列到统一背景→配合文字组合为海报。原子能力表中明显缺少:1)'图像抠图/背景移除'能力——将现有产品照片的背景去除,原子能力表中无此专项能力;2)'多图像精准位置排版合成'能力——将多张抠好的素材按网格/指定位置整齐拼排到统一背景上,这与CAP-020(多主体场景合成)侧重角色一致性不同,此处需要的是像素级排版控制。需要调研:1)AI工具中是否有专用的背景移除/抠图工具(如Remove.bg集成、ComfyUI的BiRefNet/REMBG节点);2)是否有支持多图精准网格排版合成的AI能力;3)Nano Banana Pro的多图输入(CAP-020)是否能满足'整齐排列'的排版控制需求"
  2171. },
  2172. {
  2173. "requirement_id": "REQ_082",
  2174. "requirement_text": "对同一场景或主体生成多个不同距离和景别的画面,包括远景展示整体环境、中景呈现主体与环境关系、近景突出细节,形成一组视角丰富的图片集合",
  2175. "source_subtree": {
  2176. "parent_node": "视角选择",
  2177. "parent_id": 15895,
  2178. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度/视角选择"
  2179. },
  2180. "source_nodes": [
  2181. "多角度呈现",
  2182. "全景广角"
  2183. ],
  2184. "source_posts": [
  2185. "648d8edf0000000011013447",
  2186. "6774ab9a0000000009015a3f",
  2187. "68538f7c000000002400805b",
  2188. "685f974300000000120144db",
  2189. "692d3b99000000001e022295",
  2190. "6960e87a000000000e00c216"
  2191. ],
  2192. "matched_capabilities": [
  2193. "CAP-001",
  2194. "CAP-008"
  2195. ],
  2196. "capability_combination": "CAP-001(文本到图像生成)通过在提示词中分别描述远景/中景/近景的构图参数(如 'wide shot showing full environment'、'medium shot showing subject and surroundings'、'close-up shot highlighting details')生成不同景别的图像;CAP-008(批量图像生成)可在单次工作流中批量生成多张不同景别的图像,形成完整图片集合。两者组合可完整实现该需求。",
  2197. "match_status": "完全满足",
  2198. "needs_research": false,
  2199. "research_note": ""
  2200. },
  2201. {
  2202. "requirement_id": "REQ_083",
  2203. "requirement_text": "生成采用非常规拍摄角度的图片,如从低角度仰拍、从高处俯视、或模拟第一人称主观视角看向场景,让画面产生独特的视觉冲击感",
  2204. "source_subtree": {
  2205. "parent_node": "视角选择",
  2206. "parent_id": 15895,
  2207. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度/视角选择"
  2208. },
  2209. "source_nodes": [
  2210. "特殊视角",
  2211. "多角度呈现"
  2212. ],
  2213. "source_posts": [
  2214. "648d8edf0000000011013447",
  2215. "6774ab9a0000000009015a3f",
  2216. "68538f7c000000002400805b",
  2217. "685f974300000000120144db",
  2218. "692d3b99000000001e022295",
  2219. "6960e87a000000000e00c216"
  2220. ],
  2221. "matched_capabilities": [
  2222. "CAP-001"
  2223. ],
  2224. "capability_combination": "CAP-001(文本到图像生成)通过在提示词中明确描述特殊视角参数(如 'low angle shot looking up'、'bird’s eye view from above'、'first person perspective'、'worm’s eye view')即可引导模型生成对应非常规角度的图像。Midjourney v8、FLUX.2 [max]、Nano Banana Pro 等工具均对摄影构图提示词有良好的遵循性,可直接实现仰拍、俯视、主观视角等效果。",
  2225. "match_status": "完全满足",
  2226. "needs_research": false,
  2227. "research_note": ""
  2228. },
  2229. {
  2230. "requirement_id": "REQ_084",
  2231. "requirement_text": "生成能展示宽广空间感的室内或室外全景图,画面中包含完整的环境纵深,让观看者感受到场景的整体规模和空间层次",
  2232. "source_subtree": {
  2233. "parent_node": "视角选择",
  2234. "parent_id": 15895,
  2235. "context_path": "/root/呈现/视觉/构图编排/空间布局/景别角度/视角选择"
  2236. },
  2237. "source_nodes": [
  2238. "全景广角",
  2239. "特殊视角"
  2240. ],
  2241. "source_posts": [
  2242. "648d8edf0000000011013447",
  2243. "6774ab9a0000000009015a3f",
  2244. "68538f7c000000002400805b",
  2245. "685f974300000000120144db",
  2246. "692d3b99000000001e022295",
  2247. "6960e87a000000000e00c216"
  2248. ],
  2249. "matched_capabilities": [
  2250. "CAP-001",
  2251. "CAP-016"
  2252. ],
  2253. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述广角全景构图(如 'wide angle panoramic view'、'ultra-wide shot with deep perspective'、'expansive interior with full depth of field')生成具有空间纵深感的全景图;CAP-016(生成阶段原生高分辨率输出)可配合使用宽幅宽高比输出(如 Midjourney v8 支持最大 4:1 宽高比的 HD 模式,Nano Banana Pro 支持 21:9 宽高比),使全景图在宽幅画面中更完整地呈现空间层次和整体规模。",
  2254. "match_status": "完全满足",
  2255. "needs_research": false,
  2256. "research_note": ""
  2257. },
  2258. {
  2259. "requirement_id": "REQ_094",
  2260. "requirement_text": "生成具有强烈戏剧性光影对比的户外场景图,画面中光源方向明确(如侧光或逆光),亮部与暗部之间形成鲜明反差,阴影轮廓清晰,整体呈现出电影感或艺术摄影风格的视觉张力",
  2261. "source_subtree": {
  2262. "parent_node": "光影表现",
  2263. "parent_id": 15936,
  2264. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感/光影表现"
  2265. },
  2266. "source_nodes": [
  2267. "明暗对比",
  2268. "光源特征"
  2269. ],
  2270. "source_posts": [
  2271. "665971bb000000001303d005",
  2272. "681c64ce000000002200554c",
  2273. "68946e0d000000002500ef6e",
  2274. "692a535f0000000019026d5b",
  2275. "692cc7ab000000001b030110",
  2276. "6973742d000000002801e8aa"
  2277. ],
  2278. "matched_capabilities": [
  2279. "CAP-001",
  2280. "CAP-004"
  2281. ],
  2282. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述侧光/逆光方向、强烈明暗对比、清晰阴影轮廓等光影特征直接生成目标图像;CAP-004(风格切换与风格控制)通过风格参数(如 Midjourney --stylize 或 --sref 风格参考图)进一步强化电影感或艺术摄影风格的视觉呈现,两者组合可完整实现该需求。",
  2283. "match_status": "完全满足",
  2284. "needs_research": false,
  2285. "research_note": ""
  2286. },
  2287. {
  2288. "requirement_id": "REQ_095",
  2289. "requirement_text": "生成室内暖光氛围图,画面中多个光源(吊灯、筒灯、窗外自然光)共同营造出温暖柔和的米色调空间,光线从不同方向照射,形成层次丰富的软阴影,整体氛围温馨舒适",
  2290. "source_subtree": {
  2291. "parent_node": "光影表现",
  2292. "parent_id": 15936,
  2293. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感/光影表现"
  2294. },
  2295. "source_nodes": [
  2296. "光源特征",
  2297. "氛围营造"
  2298. ],
  2299. "source_posts": [
  2300. "665971bb000000001303d005",
  2301. "681c64ce000000002200554c",
  2302. "68946e0d000000002500ef6e",
  2303. "692a535f0000000019026d5b",
  2304. "692cc7ab000000001b030110",
  2305. "6973742d000000002801e8aa"
  2306. ],
  2307. "matched_capabilities": [
  2308. "CAP-001",
  2309. "CAP-004"
  2310. ],
  2311. "capability_combination": "CAP-001(文本到图像生成)通过提示词详细描述多光源类型(吊灯、筒灯、窗外自然光)、暖色调、米色空间、软阴影层次等要素生成室内场景图;CAP-004(风格切换与风格控制)可通过风格参数或参考图进一步精准控制温馨舒适的整体氛围调性,两者组合可完整实现该需求。",
  2312. "match_status": "完全满足",
  2313. "needs_research": false,
  2314. "research_note": ""
  2315. },
  2316. {
  2317. "requirement_id": "REQ_096",
  2318. "requirement_text": "生成充满魔幻或超现实感的彩色光效场景,画面中有多种颜色的光线(如橙、蓝、紫等)交织流动,光源本身成为视觉焦点,整体营造出梦幻、神秘或节日感的强烈氛围",
  2319. "source_subtree": {
  2320. "parent_node": "光影表现",
  2321. "parent_id": 15936,
  2322. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化/光影质感/光影表现"
  2323. },
  2324. "source_nodes": [
  2325. "氛围营造",
  2326. "光源特征"
  2327. ],
  2328. "source_posts": [
  2329. "665971bb000000001303d005",
  2330. "681c64ce000000002200554c",
  2331. "68946e0d000000002500ef6e",
  2332. "692a535f0000000019026d5b",
  2333. "692cc7ab000000001b030110",
  2334. "6973742d000000002801e8aa"
  2335. ],
  2336. "matched_capabilities": [
  2337. "CAP-001",
  2338. "CAP-004"
  2339. ],
  2340. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述多色彩光线(橙、蓝、紫)交织流动、光源作为视觉焦点、超现实感等要素直接生成目标场景;CAP-004(风格切换与风格控制)通过 --stylize 参数提升风格化程度或使用 --sref 风格参考图强化梦幻/神秘/节日感的氛围表达,两者组合可完整实现该需求。",
  2341. "match_status": "完全满足",
  2342. "needs_research": false,
  2343. "research_note": ""
  2344. },
  2345. {
  2346. "requirement_id": "REQ_001",
  2347. "requirement_text": "生成人物在不同场景下呈现丰富面部表情的图片,例如夸张的痛苦、无奈、开心、困倦等神态,表情要生动传神、情绪感强烈",
  2348. "source_subtree": {
  2349. "parent_node": "人物表现",
  2350. "parent_id": 15912,
  2351. "context_path": "/root/呈现/视觉/形象塑造/人物表现"
  2352. },
  2353. "source_nodes": [
  2354. "表情神态",
  2355. "模拟扮演"
  2356. ],
  2357. "source_posts": [
  2358. "648d8edf0000000011013447",
  2359. "66619827000000000600486f",
  2360. "68946e0d000000002500ef6e",
  2361. "692d3b99000000001e022295",
  2362. "6960e87a000000000e00c216"
  2363. ],
  2364. "matched_capabilities": [
  2365. "CAP-001",
  2366. "CAP-003"
  2367. ],
  2368. "capability_combination": "CAP-001(文本到图像生成)通过详细的提示词描述目标表情和情绪(如夸张痛苦、无奈、开心、困倦等),直接生成对应神态的人物图像;CAP-003(图像主体一致性保持)在需要同一人物呈现多种表情时,以参考图为输入保持人物外观一致,仅通过提示词切换表情描述,批量生成不同场景下的表情系列图。",
  2369. "match_status": "完全满足",
  2370. "needs_research": false,
  2371. "research_note": ""
  2372. },
  2373. {
  2374. "requirement_id": "REQ_002",
  2375. "requirement_text": "生成人物与道具、环境或其他角色发生互动的画面,例如人物摆弄物品、与道具合影、在特定场景中做出配合动作等,画面要体现人物和周围元素之间的关联感",
  2376. "source_subtree": {
  2377. "parent_node": "人物表现",
  2378. "parent_id": 15912,
  2379. "context_path": "/root/呈现/视觉/形象塑造/人物表现"
  2380. },
  2381. "source_nodes": [
  2382. "互动协作",
  2383. "出镜展示"
  2384. ],
  2385. "source_posts": [
  2386. "648d8edf0000000011013447",
  2387. "66619827000000000600486f",
  2388. "68946e0d000000002500ef6e",
  2389. "692d3b99000000001e022295",
  2390. "6960e87a000000000e00c216"
  2391. ],
  2392. "matched_capabilities": [
  2393. "CAP-001",
  2394. "CAP-002",
  2395. "CAP-003",
  2396. "CAP-020"
  2397. ],
  2398. "capability_combination": "CAP-001(文本到图像生成)通过提示词详细描述人物与道具/环境/其他角色的互动动作和场景关系,直接生成互动画面;CAP-002(结构/姿态控制生成)通过姿态骨架约束人物与道具互动时的具体姿态,确保动作自然合理;CAP-003(图像主体一致性保持)在需要固定人物外观的前提下切换不同互动场景;CAP-020(多主体场景合成)在涉及多角色互动时,将多个角色参考图合成到同一场景中,体现角色间的关联感。",
  2399. "match_status": "完全满足",
  2400. "needs_research": false,
  2401. "research_note": ""
  2402. },
  2403. {
  2404. "requirement_id": "REQ_003",
  2405. "requirement_text": "生成将动物(如猫咪)拟人化扮演特定角色或情境的图片,赋予其人类的表情、姿态和道具,用来传达幽默或情感共鸣的视觉效果",
  2406. "source_subtree": {
  2407. "parent_node": "人物表现",
  2408. "parent_id": 15912,
  2409. "context_path": "/root/呈现/视觉/形象塑造/人物表现"
  2410. },
  2411. "source_nodes": [
  2412. "模拟扮演",
  2413. "侧面塑造"
  2414. ],
  2415. "source_posts": [
  2416. "648d8edf0000000011013447",
  2417. "66619827000000000600486f",
  2418. "68946e0d000000002500ef6e",
  2419. "692d3b99000000001e022295",
  2420. "6960e87a000000000e00c216"
  2421. ],
  2422. "matched_capabilities": [
  2423. "CAP-001",
  2424. "CAP-002",
  2425. "CAP-004"
  2426. ],
  2427. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述动物拟人化的具体角色、情境、表情和道具(如「穿西装打领带、表情无奈的猫咪坐在办公桌前」),直接生成拟人化动物图像;CAP-002(结构/姿态控制生成)通过姿态骨架约束动物呈现人类姿态(如站立、坐姿、持物等),使拟人化效果更自然;CAP-004(风格切换与风格控制)通过风格参数或LoRA调整画面整体风格(如卡通、写实、插画),配合幽默或情感共鸣的视觉表达需求。",
  2428. "match_status": "完全满足",
  2429. "needs_research": false,
  2430. "research_note": ""
  2431. },
  2432. {
  2433. "requirement_id": "REQ_019",
  2434. "requirement_text": "将人物照片与中国传统吉祥符号(如双喜字、红玫瑰、金色祝福文字)融合,生成具有强烈喜庆氛围的定制化图案,人物面孔清晰嵌入红色喜庆背景中",
  2435. "source_subtree": {
  2436. "parent_node": "视觉符号",
  2437. "parent_id": 15902,
  2438. "context_path": "/root/呈现/视觉/形象塑造/符号元素/视觉符号"
  2439. },
  2440. "source_nodes": [
  2441. "图形图标",
  2442. "标识辨识",
  2443. "视觉意象"
  2444. ],
  2445. "source_posts": [
  2446. "6602bd07000000001203348c",
  2447. "67284f9c000000001901875a",
  2448. "68737e97000000000d027b81",
  2449. "68a8241a000000001c011403",
  2450. "68c15181000000001b01c358"
  2451. ],
  2452. "matched_capabilities": [
  2453. "CAP-003",
  2454. "CAP-014",
  2455. "CAP-001"
  2456. ],
  2457. "capability_combination": "CAP-003(图像主体一致性保持)以人物照片为参考图输入,保持人物面孔特征清晰嵌入生成图像;CAP-014(图像内文字渲染)负责在图像中渲染双喜字、金色祝福文字等中文文字元素;CAP-001(文本到图像生成)通过提示词描述红色喜庆背景、红玫瑰、吉祥符号等视觉元素,生成整体喜庆氛围图案;三者组合可实现人物面孔与传统吉祥符号融合的定制化喜庆图案",
  2458. "match_status": "需要调研",
  2459. "needs_research": true,
  2460. "research_note": "现有能力组合(CAP-003+CAP-014+CAP-001)可以覆盖人物面孔保持、文字渲染和喜庆背景生成,但存在关键缺口:双喜字、吉祥纹样等中国传统图形符号属于复杂装饰性图形元素,需要确认现有工具对中国传统纹样图形的生成精准度;同时人物面孔与复杂装饰性背景的自然融合(非简单叠加)效果需要调研,特别是面孔清晰嵌入红色喜庆背景时的边缘融合质量。需调研方向:1)Nano Banana Pro 或 FLUX.2 [max] 对中国传统吉祥纹样图形的生成准确度;2)人物照片与装饰性背景深度融合(非换背景)的实现方式"
  2461. },
  2462. {
  2463. "requirement_id": "REQ_020",
  2464. "requirement_text": "制作统一模板风格的系列信息卡片,每张卡片包含固定的图标符号(如皇冠等级图标)、彩色标题文字和配图,整体视觉风格一致、可批量复用",
  2465. "source_subtree": {
  2466. "parent_node": "视觉符号",
  2467. "parent_id": 15902,
  2468. "context_path": "/root/呈现/视觉/形象塑造/符号元素/视觉符号"
  2469. },
  2470. "source_nodes": [
  2471. "图形图标",
  2472. "标识辨识"
  2473. ],
  2474. "source_posts": [
  2475. "6602bd07000000001203348c",
  2476. "67284f9c000000001901875a",
  2477. "68737e97000000000d027b81",
  2478. "68a8241a000000001c011403",
  2479. "68c15181000000001b01c358"
  2480. ],
  2481. "matched_capabilities": [
  2482. "CAP-001",
  2483. "CAP-014",
  2484. "CAP-004",
  2485. "CAP-008"
  2486. ],
  2487. "capability_combination": "CAP-001(文本到图像生成)生成每张卡片的配图内容;CAP-014(图像内文字渲染)在卡片中渲染彩色标题文字;CAP-004(风格切换与风格控制)通过统一风格参数或LoRA确保系列卡片视觉风格一致;CAP-008(批量图像生成)实现系列卡片的批量自动化生产",
  2488. "match_status": "需要调研",
  2489. "needs_research": true,
  2490. "research_note": "现有能力可覆盖文字渲染、风格统一和批量生成,但存在关键缺口:固定图标符号(如皇冠等级图标)在每张卡片中需保持像素级一致的图形元素复用,现有能力表中没有明确支持「固定UI图标元素跨图复用」的能力——CAP-003主要针对人物/产品主体一致性,不专门针对图标符号的精确复用;此外卡片的整体排版布局(图标位置固定、文字区域固定、配图区域固定)属于模板化排版能力,现有能力表未明确覆盖。需调研方向:1)AI图像生成工具是否支持基于固定排版模板的卡片生成(如锁定图标位置和尺寸);2)图标符号跨批次精确复用的实现方式(是否需要结合图像合成/后处理工具)"
  2491. },
  2492. {
  2493. "requirement_id": "REQ_021",
  2494. "requirement_text": "生成黑色科技感背景的人物宣传海报,背景带有流光线条或霓虹光效,人物照片与品牌Logo、活动标识、二维码等视觉元素整齐排布,形成高辨识度的系列展示图",
  2495. "source_subtree": {
  2496. "parent_node": "视觉符号",
  2497. "parent_id": 15902,
  2498. "context_path": "/root/呈现/视觉/形象塑造/符号元素/视觉符号"
  2499. },
  2500. "source_nodes": [
  2501. "标识辨识",
  2502. "视觉意象",
  2503. "图形图标"
  2504. ],
  2505. "source_posts": [
  2506. "6602bd07000000001203348c",
  2507. "67284f9c000000001901875a",
  2508. "68737e97000000000d027b81",
  2509. "68a8241a000000001c011403",
  2510. "68c15181000000001b01c358"
  2511. ],
  2512. "matched_capabilities": [
  2513. "CAP-003",
  2514. "CAP-001",
  2515. "CAP-004",
  2516. "CAP-014",
  2517. "CAP-008"
  2518. ],
  2519. "capability_combination": "CAP-003(图像主体一致性保持)以人物照片为参考图保持人物外观特征;CAP-001(文本到图像生成)通过提示词描述黑色科技感背景、流光线条、霓虹光效等视觉元素;CAP-004(风格切换与风格控制)确保系列海报视觉风格统一;CAP-014(图像内文字渲染)渲染海报中的文字信息;CAP-008(批量图像生成)实现系列展示图的批量生产",
  2520. "match_status": "需要调研",
  2521. "needs_research": true,
  2522. "research_note": "现有能力可覆盖人物保持、科技感背景生成和系列风格统一,但存在关键缺口:1)品牌Logo、活动标识、二维码等精确图形元素需要以像素精确的方式嵌入海报指定位置,特别是二维码必须保持可扫描的精确图形,AI图像生成工具通常无法保证二维码等精确图形的像素级准确复现;2)多视觉元素(人物+Logo+标识+二维码)在海报中的「整齐排布」涉及精确的版式布局控制,现有能力表未明确覆盖版式/排版精确控制能力。需调研方向:1)AI工具是否支持将外部精确图形(Logo、二维码)以指定位置和尺寸嵌入生成图像(类似图层合成);2)是否需要结合设计工具(如Figma、PS)进行后期精确排版合成,而非纯AI生成"
  2523. },
  2524. {
  2525. "requirement_id": "REQ_025",
  2526. "requirement_text": "生成穿着完整冬季搭配的人物形象,展示黑色羽绒服、红色围巾、红色手套、宽腿裤等单品的组合穿搭效果,呈现从全身到局部细节的多角度造型展示",
  2527. "source_subtree": {
  2528. "parent_node": "穿搭呈现",
  2529. "parent_id": 15893,
  2530. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/穿搭呈现"
  2531. },
  2532. "source_nodes": [
  2533. "搭配手法",
  2534. "整体形象",
  2535. "细节修饰"
  2536. ],
  2537. "source_posts": [
  2538. "66daeddb000000002603ea42",
  2539. "67b2a7f7000000002802a0d7",
  2540. "681c64ce000000002200554c",
  2541. "68ca143d000000001202c3de",
  2542. "6960e87a000000000e00c216"
  2543. ],
  2544. "matched_capabilities": [
  2545. "CAP-001",
  2546. "CAP-002",
  2547. "CAP-016"
  2548. ],
  2549. "capability_combination": "CAP-001(文本到图像生成)通过详细提示词描述服装单品组合生成人物穿搭图;CAP-002(结构/姿态控制生成)通过ControlNet控制人物姿态,实现全身正面、侧面、局部特写等多角度构图;CAP-016(生成阶段原生高分辨率输出)确保服装面料纹理、围巾编织细节等局部细节清晰可见",
  2550. "match_status": "完全满足",
  2551. "needs_research": false,
  2552. "research_note": ""
  2553. },
  2554. {
  2555. "requirement_id": "REQ_026",
  2556. "requirement_text": "生成宠物穿着服装的可爱造型图,展示猫咪穿上印花连体衣的整体穿着效果,需要清晰呈现服装的图案、版型与宠物身体的贴合细节",
  2557. "source_subtree": {
  2558. "parent_node": "穿搭呈现",
  2559. "parent_id": 15893,
  2560. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/穿搭呈现"
  2561. },
  2562. "source_nodes": [
  2563. "整体形象",
  2564. "细节修饰"
  2565. ],
  2566. "source_posts": [
  2567. "66daeddb000000002603ea42",
  2568. "67b2a7f7000000002802a0d7",
  2569. "681c64ce000000002200554c",
  2570. "68ca143d000000001202c3de",
  2571. "6960e87a000000000e00c216"
  2572. ],
  2573. "matched_capabilities": [
  2574. "CAP-001",
  2575. "CAP-016"
  2576. ],
  2577. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述猫咪穿着印花连体衣的造型生成图像;CAP-016(生成阶段原生高分辨率输出)确保印花图案细节、服装与猫咪身体贴合的版型细节清晰呈现",
  2578. "match_status": "需要调研",
  2579. "needs_research": true,
  2580. "research_note": "CAP-001可以生成宠物穿衣图像,CAP-016可保障细节清晰度,但核心难点在于:猫咪体型特殊(四肢短、身体圆润),AI生成宠物穿衣图像时服装贴合度、版型准确性难以保证,且印花图案在弯曲身体上的透视变形效果是否能准确呈现存疑。需要调研:1)现有文生图工具对宠物穿衣场景的实际生成质量;2)是否有专门针对宠物服装展示的LoRA或微调模型;3)CAP-003(主体一致性)结合真实猫咪参考图是否能提升服装贴合细节的准确性"
  2581. },
  2582. {
  2583. "requirement_id": "REQ_027",
  2584. "requirement_text": "生成创意合成图,将人物穿搭形象嵌入特定场景容器中(如超市生鲜托盘),使人物服装与场景产生趣味性视觉对比,同时保留服装细节的清晰可见",
  2585. "source_subtree": {
  2586. "parent_node": "穿搭呈现",
  2587. "parent_id": 15893,
  2588. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/穿搭呈现"
  2589. },
  2590. "source_nodes": [
  2591. "搭配手法",
  2592. "整体形象"
  2593. ],
  2594. "source_posts": [
  2595. "66daeddb000000002603ea42",
  2596. "67b2a7f7000000002802a0d7",
  2597. "681c64ce000000002200554c",
  2598. "68ca143d000000001202c3de",
  2599. "6960e87a000000000e00c216"
  2600. ],
  2601. "matched_capabilities": [
  2602. "CAP-001",
  2603. "CAP-003"
  2604. ],
  2605. "capability_combination": "CAP-001(文本到图像生成)通过提示词描述人物被置于超市生鲜托盘等容器场景中的创意合成画面;CAP-003(图像主体一致性保持)以人物穿搭参考图为输入,确保嵌入场景后服装外观特征保持一致",
  2606. "match_status": "需要调研",
  2607. "needs_research": true,
  2608. "research_note": "CAP-001可尝试通过提示词直接描述此类创意合成场景,CAP-003可保持人物服装一致性,但核心难点在于:将人物精确嵌入特定容器(如托盘)并产生视觉上合理的比例关系、透视关系和边界融合,属于复杂的空间合成任务,单纯文生图难以精确控制人物与容器的嵌套关系。需要调研:1)CAP-012(图像局部重绘)是否可先生成场景容器再将人物重绘嵌入;2)CAP-020(多主体场景合成)能否将人物与容器场景合成;3)是否需要结合CAP-002(姿态控制)约束人物在容器内的姿态和比例;4)现有工具对此类超现实创意合成的实际效果评估"
  2609. },
  2610. {
  2611. "requirement_id": "REQ_031",
  2612. "requirement_text": "将真实照片中的人物与卡通/奇幻元素合成,例如给人物添加蟑螂的触角和腿,使人物看起来像变成了一只蟑螂,整体画面自然融合不突兀",
  2613. "source_subtree": {
  2614. "parent_node": "画质优化",
  2615. "parent_id": 15884,
  2616. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化"
  2617. },
  2618. "source_nodes": [
  2619. "后期加工",
  2620. "画质优化"
  2621. ],
  2622. "source_posts": [
  2623. "67e68c9d00000000060282fb",
  2624. "68077d02000000001c02dd81",
  2625. "682ede8f000000002202bff2",
  2626. "683d8695000000001200012a",
  2627. "68d610800000000012023282"
  2628. ],
  2629. "matched_capabilities": [
  2630. "CAP-012"
  2631. ],
  2632. "capability_combination": "CAP-012 可以对真实照片进行局部重绘,在指定区域添加蟑螂触角、腿等元素,但核心挑战在于将卡通/奇幻元素与真实照片自然融合,且需要精确控制添加元素的位置和形态",
  2633. "match_status": "需要调研",
  2634. "needs_research": true,
  2635. "research_note": "CAP-012(图像局部重绘)可以在指定区域添加新元素,但该需求的核心难点是:1)将卡通风格的蟑螂元素(触角、腿)与真实人物照片自然融合,涉及跨风格合成(写实+卡通);2)需要精确控制添加元素的位置(如头顶添加触角、身体两侧添加腿)并保持透视和光照一致;3)现有能力表中没有明确支持'真实照片+卡通元素跨风格自然融合'的专项能力。需要调研:AI图像编辑工具是否支持将卡通/手绘风格元素与写实照片无缝合成、是否有专门的图像合成/图层融合能力。"
  2636. },
  2637. {
  2638. "requirement_id": "REQ_032",
  2639. "requirement_text": "给普通猫咪照片套上不同职业的服装和场景(如医生、上班族、老板等),并保持猫咪面部表情清晰可辨,制作出系列表情包拼贴图",
  2640. "source_subtree": {
  2641. "parent_node": "画质优化",
  2642. "parent_id": 15884,
  2643. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化"
  2644. },
  2645. "source_nodes": [
  2646. "后期加工",
  2647. "画质优化"
  2648. ],
  2649. "source_posts": [
  2650. "67e68c9d00000000060282fb",
  2651. "68077d02000000001c02dd81",
  2652. "682ede8f000000002202bff2",
  2653. "683d8695000000001200012a",
  2654. "68d610800000000012023282"
  2655. ],
  2656. "matched_capabilities": [
  2657. "CAP-003",
  2658. "CAP-012",
  2659. "CAP-008",
  2660. "CAP-005"
  2661. ],
  2662. "capability_combination": "CAP-003 保持猫咪面部特征一致性,CAP-012 对猫咪照片进行局部重绘添加职业服装和场景背景,CAP-008 批量生成多个职业版本,CAP-005 确保猫咪面部表情清晰可辨;但拼贴图排版合成环节仍有缺口",
  2663. "match_status": "需要调研",
  2664. "needs_research": true,
  2665. "research_note": "现有能力可以做到:CAP-003保持猫咪外观一致性、CAP-012替换服装和背景、CAP-008批量生成系列图、CAP-005增强面部清晰度。缺少的能力:1)将多张生成图拼贴排版为表情包拼贴图的能力,原子能力表中没有图像拼贴/排版合成能力;2)猫咪穿着职业服装的合成效果是否自然(猫咪体型与人类服装的适配问题)需要验证。需要调研:AI工具是否支持多图拼贴排版输出,或是否有专门的表情包拼贴图生成能力。"
  2666. },
  2667. {
  2668. "requirement_id": "REQ_033",
  2669. "requirement_text": "在真实物体照片上叠加手绘风格的简笔画元素,例如在猕猴桃切片上添加卡通五官和小触角,让照片呈现出实物与手绘结合的趣味效果",
  2670. "source_subtree": {
  2671. "parent_node": "画质优化",
  2672. "parent_id": 15884,
  2673. "context_path": "/root/呈现/视觉/影像制作/后期处理/画质优化"
  2674. },
  2675. "source_nodes": [
  2676. "后期加工",
  2677. "画质优化"
  2678. ],
  2679. "source_posts": [
  2680. "67e68c9d00000000060282fb",
  2681. "68077d02000000001c02dd81",
  2682. "682ede8f000000002202bff2",
  2683. "683d8695000000001200012a",
  2684. "68d610800000000012023282"
  2685. ],
  2686. "matched_capabilities": [
  2687. "CAP-012"
  2688. ],
  2689. "capability_combination": "CAP-012 可以在真实物体照片的指定区域重绘添加新元素,但核心需求是在写实照片上叠加手绘/简笔画风格元素并保持风格差异(即手绘元素要看起来像手绘而非写实生成)",
  2690. "match_status": "需要调研",
  2691. "needs_research": true,
  2692. "research_note": "CAP-012(图像局部重绘)可以在照片上添加新元素,但该需求的核心难点是:1)添加的元素必须保持'手绘简笔画'风格,与写实照片形成明显的风格对比(而非融合),这与CAP-012默认追求'自然融合'的目标相反;2)需要精确控制新增元素的风格为手绘/卡通,同时保持原始照片区域不变;3)原子能力表中没有明确支持'在写实照片上叠加指定手绘风格元素'且保持风格差异的专项能力。需要调研:AI图像编辑工具是否支持在局部区域以特定手绘风格生成元素并叠加到写实照片上,是否有专门的混合风格图层合成能力。"
  2693. },
  2694. {
  2695. "requirement_id": "REQ_040",
  2696. "requirement_text": "制作图文卡片时,需要让插图与文字在语义上高度呼应——比如用可爱小驴的不同表情和动作配合对应的幽默文字,每张小卡片中图在上、文字在下,插图内容直接反映文字含义,形成一眼就能看懂的图文配合效果",
  2697. "source_subtree": {
  2698. "parent_node": "图文关系",
  2699. "parent_id": 15885,
  2700. "context_path": "/root/呈现/视觉/构图编排/版面设计/图文关系"
  2701. },
  2702. "source_nodes": [
  2703. "图文关联",
  2704. "图文编排"
  2705. ],
  2706. "source_posts": [
  2707. "65febd8e0000000012035538",
  2708. "67206035000000001b02f4b1",
  2709. "6735b1a0000000001b0137f5",
  2710. "67adb23f000000002a00c240",
  2711. "6961b301000000001a02f6af"
  2712. ],
  2713. "matched_capabilities": [
  2714. "CAP-001",
  2715. "CAP-003",
  2716. "CAP-014"
  2717. ],
  2718. "capability_combination": "CAP-001 根据每句幽默文字的语义生成对应表情/动作的小驴插图;CAP-003 保持小驴角色在不同卡片中外观一致;CAP-014 在图像中渲染对应的幽默文字,使文字作为图像视觉元素呈现在插图下方",
  2719. "match_status": "需要调研",
  2720. "needs_research": true,
  2721. "research_note": "CAP-001+CAP-003 可生成语义对应的插图,CAP-014 可在图像内渲染文字,但三者组合仍存在缺口:1)图在上、文字在下的卡片版式排版布局控制(精确的空间分区、留白比例)在现有能力中没有明确支持;2)图文语义精准对应的自动化流程(即根据文字内容自动生成对应插图并排版为卡片)缺乏专项能力支撑;需要调研是否有支持图文版式自动排版的 AI 工具,或是否可通过 ComfyUI 工作流组合实现卡片版式控制"
  2722. },
  2723. {
  2724. "requirement_id": "REQ_041",
  2725. "requirement_text": "制作多图拼贴帖子时,需要将多张照片或截图按照叙事顺序排列在一张大图中,并在关键图片上叠加说明性文字标注,让图片和文字共同讲述一个完整故事,文字起到补充说明和情感点评的作用",
  2726. "source_subtree": {
  2727. "parent_node": "图文关系",
  2728. "parent_id": 15885,
  2729. "context_path": "/root/呈现/视觉/构图编排/版面设计/图文关系"
  2730. },
  2731. "source_nodes": [
  2732. "图文关联",
  2733. "图文编排"
  2734. ],
  2735. "source_posts": [
  2736. "65febd8e0000000012035538",
  2737. "67206035000000001b02f4b1",
  2738. "6735b1a0000000001b0137f5",
  2739. "67adb23f000000002a00c240",
  2740. "6961b301000000001a02f6af"
  2741. ],
  2742. "matched_capabilities": [
  2743. "CAP-014"
  2744. ],
  2745. "capability_combination": "CAP-014 可在图像中渲染文字标注内容,使说明性文字作为视觉元素叠加在图片上",
  2746. "match_status": "需要调研",
  2747. "needs_research": true,
  2748. "research_note": "CAP-014 仅能在单张生成图像中渲染文字,但该需求的核心是:1)将多张已有照片/截图按叙事顺序拼合为一张大图(多图拼贴/画布合成能力),现有原子能力表中无明确的多图拼贴排版能力;2)在拼贴大图的指定位置叠加文字标注(精确位置控制的文字叠加);CAP-020 多主体场景合成偏向将多个主体合成到同一场景,与按叙事顺序排列已有图片的拼贴需求不同;需要调研支持多图拼贴画布排版、图片网格布局生成的 AI 工具或 ComfyUI 节点方案"
  2749. },
  2750. {
  2751. "requirement_id": "REQ_042",
  2752. "requirement_text": "制作信息图文海报时,需要将大标题、分类小标题与正文段落按照清晰的层级排布在版面上,标题用大字醒目展示,正文紧跟其下,整体版面分区明确、图文对应,让读者能快速扫读获取信息",
  2753. "source_subtree": {
  2754. "parent_node": "图文关系",
  2755. "parent_id": 15885,
  2756. "context_path": "/root/呈现/视觉/构图编排/版面设计/图文关系"
  2757. },
  2758. "source_nodes": [
  2759. "图文编排",
  2760. "图文关联"
  2761. ],
  2762. "source_posts": [
  2763. "65febd8e0000000012035538",
  2764. "67206035000000001b02f4b1",
  2765. "6735b1a0000000001b0137f5",
  2766. "67adb23f000000002a00c240",
  2767. "6961b301000000001a02f6af"
  2768. ],
  2769. "matched_capabilities": [
  2770. "CAP-001",
  2771. "CAP-014"
  2772. ],
  2773. "capability_combination": "CAP-001 生成海报的背景图像和视觉元素;CAP-014 在图像中渲染标题、小标题和正文等多层级文字内容",
  2774. "match_status": "需要调研",
  2775. "needs_research": true,
  2776. "research_note": "CAP-001 可生成海报视觉背景,CAP-014 可渲染文字,但该需求的核心挑战在于:1)多层级文字排版(大标题/小标题/正文的字号差异、层级关系、间距控制)的精确版式设计能力,现有 CAP-014 主要针对短文字渲染,对复杂多层级段落排版的支持未有明确说明;2)版面分区明确、图文对应的结构化信息图布局控制,需要精确的空间分区能力;需要调研 Nano Banana Pro 或其他工具对复杂多层级排版信息图海报的支持程度,以及是否有专项的信息图生成能力"
  2777. },
  2778. {
  2779. "requirement_id": "REQ_058",
  2780. "requirement_text": "生成具有强烈透视纵深感的室内空间图,画面中窗框、拱门、地板线条等建筑元素形成明显的空间层次,光线从远处窗口射入,营造出由近到远的视觉延伸效果",
  2781. "source_subtree": {
  2782. "parent_node": "构图方式",
  2783. "parent_id": 15365,
  2784. "context_path": "/root/呈现/视觉/构图编排/空间布局/构图方式"
  2785. },
  2786. "source_nodes": [
  2787. "透视纵深"
  2788. ],
  2789. "source_posts": [
  2790. "664599b9000000001e01d218",
  2791. "67e37ff8000000001c008b5e",
  2792. "682a8f11000000002002a511",
  2793. "6879f4b1000000000b02c2e0",
  2794. "692a535f0000000019026d5b"
  2795. ],
  2796. "matched_capabilities": [
  2797. "CAP-001"
  2798. ],
  2799. "capability_combination": "使用 CAP-001 文本到图像生成,通过精细的提示词描述透视纵深构图(如 vanishing point perspective、leading lines、depth of field 等关键词),结合 Midjourney v8 或 FLUX.2 [max] 的照片级真实感输出,可直接生成具有强烈透视纵深感的室内空间图,包含窗框、拱门、地板线条等建筑元素及从远处窗口射入的光线效果。",
  2800. "match_status": "完全满足",
  2801. "needs_research": false,
  2802. "research_note": ""
  2803. },
  2804. {
  2805. "requirement_id": "REQ_059",
  2806. "requirement_text": "生成采用夸张变形构图的图片,例如鱼眼镜头效果将人物或场景扭曲成球形全景、仰拍使近处物体极度放大而远处极度缩小,或通过搞怪角度让画面产生强烈的视觉冲击感",
  2807. "source_subtree": {
  2808. "parent_node": "构图方式",
  2809. "parent_id": 15365,
  2810. "context_path": "/root/呈现/视觉/构图编排/空间布局/构图方式"
  2811. },
  2812. "source_nodes": [
  2813. "夸张变形"
  2814. ],
  2815. "source_posts": [
  2816. "664599b9000000001e01d218",
  2817. "67e37ff8000000001c008b5e",
  2818. "682a8f11000000002002a511",
  2819. "6879f4b1000000000b02c2e0",
  2820. "692a535f0000000019026d5b"
  2821. ],
  2822. "matched_capabilities": [
  2823. "CAP-001"
  2824. ],
  2825. "capability_combination": "使用 CAP-001 文本到图像生成,通过提示词描述鱼眼镜头(fisheye lens)、极端广角变形(extreme wide angle distortion)、仰拍透视(worm's eye view)等效果,Midjourney v8 或 FLUX.2 [max] 对此类摄影/光学效果的提示词遵循性较强,可生成夸张变形构图图像。",
  2826. "match_status": "完全满足",
  2827. "needs_research": false,
  2828. "research_note": ""
  2829. },
  2830. {
  2831. "requirement_id": "REQ_060",
  2832. "requirement_text": "生成画面中存在嵌套框架效果的图片,如在沙漠场景中用一个悬空的矩形框将主体框住形成画中画,或利用水面倒影与实景上下对称形成嵌套镜像构图,制造超现实的空间突破感",
  2833. "source_subtree": {
  2834. "parent_node": "构图方式",
  2835. "parent_id": 15365,
  2836. "context_path": "/root/呈现/视觉/构图编排/空间布局/构图方式"
  2837. },
  2838. "source_nodes": [
  2839. "嵌套突破",
  2840. "对称分割"
  2841. ],
  2842. "source_posts": [
  2843. "664599b9000000001e01d218",
  2844. "67e37ff8000000001c008b5e",
  2845. "682a8f11000000002002a511",
  2846. "6879f4b1000000000b02c2e0",
  2847. "692a535f0000000019026d5b"
  2848. ],
  2849. "matched_capabilities": [
  2850. "CAP-001"
  2851. ],
  2852. "capability_combination": "使用 CAP-001 文本到图像生成,通过提示词描述嵌套框架(nested frame、picture within picture)、悬空矩形框(floating rectangular frame)、水面镜像对称(mirror reflection symmetry)等超现实构图概念,Midjourney v8 或 FLUX.2 [max] 对超现实主义构图有一定支持,可尝试生成此类效果。",
  2853. "match_status": "需要调研",
  2854. "needs_research": true,
  2855. "research_note": "CAP-001 文本到图像生成可以尝试通过提示词描述嵌套框架和对称分割构图,但此类高度精确的超现实空间构图(悬空矩形框精确框住主体、水面倒影与实景精确对称嵌套)对提示词遵循性要求极高,现有能力能否稳定、精确地实现嵌套框架的空间位置关系和对称分割的几何精度存在不确定性。需要调研:1)Midjourney v8 / FLUX.2 [max] 对复杂超现实嵌套构图的实际生成效果;2)是否可结合 CAP-002 结构/姿态控制(ControlNet 深度图或线稿)来精确约束嵌套框架的空间位置;3)是否有专门支持超现实主义构图控制的 AI 工具或 ControlNet 预处理器。"
  2856. },
  2857. {
  2858. "requirement_id": "REQ_097",
  2859. "requirement_text": "制作大字号标题搭配正文内容的图文排版,标题文字极大且颜色鲜艳(红色、黄色等高饱和色),与正文小字形成强烈的大小对比,整体版面信息密度高、视觉冲击力强",
  2860. "source_subtree": {
  2861. "parent_node": "大字报风格",
  2862. "parent_id": 15927,
  2863. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题/排版风格/大字报风格"
  2864. },
  2865. "source_nodes": [
  2866. "大字报风格",
  2867. "通用版式",
  2868. "醒目字效"
  2869. ],
  2870. "source_posts": [
  2871. "66c5b638000000001d018e5a",
  2872. "677b5460000000000b00d33e",
  2873. "68737e97000000000d027b81",
  2874. "692fe421000000001f00691a",
  2875. "6965ea53000000000e00f0f1"
  2876. ],
  2877. "matched_capabilities": [
  2878. "CAP-014"
  2879. ],
  2880. "capability_combination": "CAP-014 可在生成图像中嵌入文字内容,Nano Banana Pro 支持复杂排版布局和多语言高保真文本渲染,可在提示词中描述大字号标题+小字正文的排版结构及高饱和色彩要求",
  2881. "match_status": "需要调研",
  2882. "needs_research": true,
  2883. "research_note": "CAP-014 支持图像内文字渲染和复杂排版布局,理论上可通过提示词描述大字报式排版结构(大标题+小正文+高饱和色)来生成。但现有能力描述中未明确说明是否支持:1)精确控制多层级文字大小比例(如标题字号与正文字号的具体倍数关系);2)高信息密度版面中多段正文文字的准确渲染(文字越多,AI渲染出错率越高);3)指定文字颜色(如纯红、纯黄等高饱和色)的精确还原。需要调研 Nano Banana Pro 或其他工具在多层级文字排版、高密度文字内容、精确色彩控制方面的实际表现和限制。"
  2884. },
  2885. {
  2886. "requirement_id": "REQ_098",
  2887. "requirement_text": "在图片上叠加大字幕文字,字体粗大醒目,常带有描边或阴影效果,文字直接覆盖在照片或场景图上,起到强调说明或搞笑点评的作用",
  2888. "source_subtree": {
  2889. "parent_node": "大字报风格",
  2890. "parent_id": 15927,
  2891. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题/排版风格/大字报风格"
  2892. },
  2893. "source_nodes": [
  2894. "字幕应用",
  2895. "醒目字效"
  2896. ],
  2897. "source_posts": [
  2898. "66c5b638000000001d018e5a",
  2899. "677b5460000000000b00d33e",
  2900. "68737e97000000000d027b81",
  2901. "692fe421000000001f00691a",
  2902. "6965ea53000000000e00f0f1"
  2903. ],
  2904. "matched_capabilities": [
  2905. "CAP-014"
  2906. ],
  2907. "capability_combination": "CAP-014 支持在生成图像中嵌入文字,可通过提示词描述粗体大字幕叠加在场景图上的效果,Nano Banana Pro 支持复杂排版布局",
  2908. "match_status": "需要调研",
  2909. "needs_research": true,
  2910. "research_note": "CAP-014 的文字渲染能力主要面向生成阶段的文字嵌入(如产品标签、Logo、广告语),但该需求的核心是:1)将大字幕叠加在已有的照片或场景图上(属于图像编辑/合成场景,而非从零生成);2)需要精确控制描边、阴影等字效样式;3)文字需覆盖在指定位置的已有图像上。现有能力中 CAP-012(图像局部重绘)可对已有图像进行编辑,但其定位是内容替换而非文字叠加。需要调研:是否有 AI 工具支持在已有图片上精确叠加带描边/阴影效果的大字幕文字,或是否需要结合图像编辑工具(如 Photoshop、Canva 等非 AI 生成工具)来实现字效叠加。"
  2911. },
  2912. {
  2913. "requirement_id": "REQ_099",
  2914. "requirement_text": "制作多宫格拼贴式内容图,每个格子内有大标题文字突出显示核心信息(如价格、品类名),配合产品图或场景图,标题字号远大于说明文字,形成层次分明的视觉结构",
  2915. "source_subtree": {
  2916. "parent_node": "大字报风格",
  2917. "parent_id": 15927,
  2918. "context_path": "/root/呈现/视觉/构图编排/版面设计/字体标题/排版风格/大字报风格"
  2919. },
  2920. "source_nodes": [
  2921. "通用版式",
  2922. "大字报风格",
  2923. "醒目字效"
  2924. ],
  2925. "source_posts": [
  2926. "66c5b638000000001d018e5a",
  2927. "677b5460000000000b00d33e",
  2928. "68737e97000000000d027b81",
  2929. "692fe421000000001f00691a",
  2930. "6965ea53000000000e00f0f1"
  2931. ],
  2932. "matched_capabilities": [
  2933. "CAP-014",
  2934. "CAP-001"
  2935. ],
  2936. "capability_combination": "CAP-001 可生成产品图或场景图素材,CAP-014 可在图像中嵌入文字内容;理论上可通过提示词描述多宫格拼贴版式+大标题+小说明文字的层次结构来生成整体版面",
  2937. "match_status": "需要调研",
  2938. "needs_research": true,
  2939. "research_note": "该需求涉及多宫格拼贴版式,具体挑战包括:1)多宫格网格布局的精确控制——AI图像生成工具对严格的网格分割、等比格子排列的控制能力存疑,现有能力表中无明确支持多宫格版式布局的能力;2)每个格子内独立的图文组合(产品图+大标题+说明文字)需要在有限空间内精确排布;3)多个格子中文字内容各不相同,高密度多文字渲染的准确率是否足够。CAP-014 的 Nano Banana Pro 支持复杂排版布局,但是否能精确实现多宫格拼贴这类结构化版式尚不明确。需要调研:Nano Banana Pro 或其他工具对多宫格/网格版式的支持程度,以及是否需要借助专业排版工具(如 Figma、Canva)来实现精确的多宫格结构。"
  2940. },
  2941. {
  2942. "requirement_id": "REQ_022",
  2943. "requirement_text": "生成宠物或动物穿戴人类服饰配件(如帽子、围巾)的画面,让动物看起来像在过节或扮演某种角色,整体效果可爱又有趣",
  2944. "source_subtree": {
  2945. "parent_node": "创意造型",
  2946. "parent_id": 15894,
  2947. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/创意造型"
  2948. },
  2949. "source_nodes": [
  2950. "拟人穿戴",
  2951. "主题扮演"
  2952. ],
  2953. "source_posts": [
  2954. "6666b3a10000000015008834",
  2955. "6774ab9a0000000009015a3f",
  2956. "692d3b99000000001e022295",
  2957. "697069b7000000002202d264"
  2958. ],
  2959. "matched_capabilities": [
  2960. "CAP-001"
  2961. ],
  2962. "capability_combination": "使用 CAP-001(文本到图像生成)直接通过提示词描述动物种类、穿戴的服饰配件、节日或角色主题、可爱风格等,Midjourney v8、FLUX.2 [max]、Nano Banana Pro 或 Seedream 5.0 Lite 均可根据提示词生成符合要求的画面",
  2963. "match_status": "完全满足",
  2964. "needs_research": false,
  2965. "research_note": ""
  2966. },
  2967. {
  2968. "requirement_id": "REQ_023",
  2969. "requirement_text": "生成将普通服装或日常物品以夸张搞怪方式穿戴的人物画面,比如把超大号短裤当长袍穿、用篮球短裤模仿古希腊长袍,产生强烈的视觉反差和幽默效果",
  2970. "source_subtree": {
  2971. "parent_node": "创意造型",
  2972. "parent_id": 15894,
  2973. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/创意造型"
  2974. },
  2975. "source_nodes": [
  2976. "夸张变形",
  2977. "创意技法",
  2978. "拟物仿形"
  2979. ],
  2980. "source_posts": [
  2981. "6666b3a10000000015008834",
  2982. "6774ab9a0000000009015a3f",
  2983. "692d3b99000000001e022295",
  2984. "697069b7000000002202d264"
  2985. ],
  2986. "matched_capabilities": [
  2987. "CAP-001"
  2988. ],
  2989. "capability_combination": "使用 CAP-001(文本到图像生成)通过详细提示词描述夸张穿戴方式、物品错位使用场景、视觉反差和幽默风格,Midjourney v8 或 FLUX.2 [max] 对此类创意概念图的提示词遵循性较强,可生成符合要求的幽默反差画面",
  2990. "match_status": "完全满足",
  2991. "needs_research": false,
  2992. "research_note": ""
  2993. },
  2994. {
  2995. "requirement_id": "REQ_024",
  2996. "requirement_text": "生成具有超现实风格的创意合成画面,将人物头部替换为宇宙星云、太极图、粒子爆炸等抽象元素,配合深蓝红色调背景,营造出哲学感或科幻感的视觉冲击",
  2997. "source_subtree": {
  2998. "parent_node": "创意造型",
  2999. "parent_id": 15894,
  3000. "context_path": "/root/呈现/视觉/形象塑造/造型装扮/创意造型"
  3001. },
  3002. "source_nodes": [
  3003. "夸张变形",
  3004. "创意技法",
  3005. "拟物仿形"
  3006. ],
  3007. "source_posts": [
  3008. "6666b3a10000000015008834",
  3009. "6774ab9a0000000009015a3f",
  3010. "692d3b99000000001e022295",
  3011. "697069b7000000002202d264"
  3012. ],
  3013. "matched_capabilities": [
  3014. "CAP-001",
  3015. "CAP-012"
  3016. ],
  3017. "capability_combination": "方案一:使用 CAP-001(文本到图像生成)直接通过提示词描述超现实风格、头部替换为星云/太极图/粒子爆炸的抽象合成效果、深蓝红色调背景及哲学/科幻氛围,Midjourney v8 或 FLUX.2 [max] 对超现实概念图支持较好。方案二:先用 CAP-001 生成人物基础图,再用 CAP-012(图像局部重绘)对头部区域进行蒙版重绘,将头部替换为指定抽象元素,实现更精准的局部替换控制",
  3018. "match_status": "完全满足",
  3019. "needs_research": false,
  3020. "research_note": ""
  3021. },
  3022. {
  3023. "requirement_id": "REQ_078",
  3024. "requirement_text": "在图片上叠加对话气泡或多行说明文字,用于讲述故事背景或补充情节说明,文字带有描边或阴影效果以确保在复杂背景上清晰可读",
  3025. "source_subtree": {
  3026. "parent_node": "标注叠加",
  3027. "parent_id": 15900,
  3028. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示/标注叠加"
  3029. },
  3030. "source_nodes": [
  3031. "文字标注",
  3032. "说明标注"
  3033. ],
  3034. "source_posts": [
  3035. "65febd8e0000000012035538",
  3036. "669b52720000000025003596",
  3037. "68a8241a000000001c011403",
  3038. "68ca25bc000000000e023656"
  3039. ],
  3040. "matched_capabilities": [
  3041. "CAP-014"
  3042. ],
  3043. "capability_combination": "CAP-014 支持在图像中嵌入文字内容,但其定位是将文字作为图像视觉元素自然融入场景(如产品标签、标牌),而非在已有图像上叠加带样式效果的对话气泡或说明文字层",
  3044. "match_status": "需要调研",
  3045. "needs_research": true,
  3046. "research_note": "CAP-014 可在生成图像时嵌入文字,但需求的核心是:1)在已有图片上后期叠加对话气泡这类特定UI元素;2)文字需要带有描边/阴影等样式效果以保证可读性;3)多行排版控制。这更接近图像后期合成/排版工具的能力(如 Canva、Photoshop、专用图文排版工具),而非 AI 图像生成能力。需要调研:是否有 AI 工具支持在已有图像上智能叠加带样式的对话气泡和说明文字,或是否有 ComfyUI 节点支持文字描边/阴影叠加合成。"
  3047. },
  3048. {
  3049. "requirement_id": "REQ_079",
  3050. "requirement_text": "制作图文并茂的科普说明卡片,每张卡片包含标题、编号、插图和详细文字说明,整体排版整齐统一,适合分步骤展示教程或知识点",
  3051. "source_subtree": {
  3052. "parent_node": "标注叠加",
  3053. "parent_id": 15900,
  3054. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示/标注叠加"
  3055. },
  3056. "source_nodes": [
  3057. "说明标注",
  3058. "专用标注"
  3059. ],
  3060. "source_posts": [
  3061. "65febd8e0000000012035538",
  3062. "669b52720000000025003596",
  3063. "68a8241a000000001c011403",
  3064. "68ca25bc000000000e023656"
  3065. ],
  3066. "matched_capabilities": [
  3067. "CAP-001",
  3068. "CAP-014"
  3069. ],
  3070. "capability_combination": "CAP-001 可生成卡片插图内容,CAP-014 可在图像中嵌入文字;但两者组合仍无法满足多元素结构化排版的需求",
  3071. "match_status": "需要调研",
  3072. "needs_research": true,
  3073. "research_note": "需求的核心是结构化多元素卡片排版:标题+编号+插图+详细文字说明需要在统一模板中精确布局,且多张卡片风格统一。CAP-001 可生成插图,CAP-014 可嵌入文字,但缺少:1)多元素精确定位排版能力(标题区、图片区、文字区的结构化布局);2)统一模板批量生成多张卡片的能力;3)详细多行文字说明的排版控制。这类需求通常需要图文排版工具(如 Canva、Adobe Express)或支持模板化排版的 AI 工具。需要调研:是否有 AI 工具支持基于模板的结构化图文卡片批量生成。"
  3074. },
  3075. {
  3076. "requirement_id": "REQ_080",
  3077. "requirement_text": "在多图拼贴海报上为每个区域叠加带图标的标签(如勾选符号+地点名称),并在整体画面上方添加大标题和副标题文字,形成图文结合的内容合集展示效果",
  3078. "source_subtree": {
  3079. "parent_node": "标注叠加",
  3080. "parent_id": 15900,
  3081. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示/标注叠加"
  3082. },
  3083. "source_nodes": [
  3084. "专用标注",
  3085. "文字标注"
  3086. ],
  3087. "source_posts": [
  3088. "65febd8e0000000012035538",
  3089. "669b52720000000025003596",
  3090. "68a8241a000000001c011403",
  3091. "68ca25bc000000000e023656"
  3092. ],
  3093. "matched_capabilities": [
  3094. "CAP-014"
  3095. ],
  3096. "capability_combination": "CAP-014 可在生成图像时嵌入文字,但无法满足多图拼贴布局和在指定区域精确叠加带图标标签的需求",
  3097. "match_status": "需要调研",
  3098. "needs_research": true,
  3099. "research_note": "需求涉及多个复杂能力:1)多图拼贴布局合成(将多张图片按区域排列);2)在每个区域精确叠加带图标的标签(图标+文字组合元素的定位);3)整体画面的层级标题排版。CAP-014 仅支持在生成阶段嵌入文字,无法实现多图拼贴布局和精确的图标+文字标签叠加。需要调研:是否有 AI 工具或 ComfyUI 工作流支持多图拼贴合成并在指定区域叠加图标标签元素,或需结合图文排版工具实现。"
  3100. },
  3101. {
  3102. "requirement_id": "REQ_081",
  3103. "requirement_text": "为多人物展示海报中的每个人物添加姓名和职位标签,并在画面顶部叠加活动主题、专场名称等层级分明的标题文字,整体风格统一、信息密度高",
  3104. "source_subtree": {
  3105. "parent_node": "标注叠加",
  3106. "parent_id": 15900,
  3107. "context_path": "/root/呈现/视觉/构图编排/版面设计/标注图示/标注叠加"
  3108. },
  3109. "source_nodes": [
  3110. "专用标注",
  3111. "引导标注",
  3112. "文字标注"
  3113. ],
  3114. "source_posts": [
  3115. "65febd8e0000000012035538",
  3116. "669b52720000000025003596",
  3117. "68a8241a000000001c011403",
  3118. "68ca25bc000000000e023656"
  3119. ],
  3120. "matched_capabilities": [
  3121. "CAP-014",
  3122. "CAP-020"
  3123. ],
  3124. "capability_combination": "CAP-020 可将多人物合成到同一场景,CAP-014 可在图像中嵌入文字;但两者组合无法实现为每个人物精确定位独立标签并保证层级标题排版的需求",
  3125. "match_status": "需要调研",
  3126. "needs_research": true,
  3127. "research_note": "需求的核心难点在于:1)为海报中每个人物精确定位并叠加对应的姓名+职位标签(需要与人物位置对齐的精确标注);2)多层级标题文字的结构化排版(活动主题、专场名称等层级关系);3)高信息密度下整体风格统一。CAP-014 的文字嵌入是生成阶段的整体融合,难以实现针对每个人物的精确独立标签定位;CAP-020 可处理多人物合成但不涉及标签叠加。需要调研:是否有 AI 工具支持在多人物图像上智能识别人物位置并自动添加对应标签,或需结合排版工具进行后期文字叠加。"
  3128. },
  3129. {
  3130. "requirement_id": "REQ_070",
  3131. "requirement_text": "生成一组多格拼贴图,每格展示同一人物在不同场景/状态下的夸张表情和肢体动作,配合幽默文字标注,整体呈现出戏剧化的情绪起伏效果(如一周心情变化、苦情崩溃、搞笑反应等)",
  3132. "source_subtree": {
  3133. "parent_node": "表演性动作",
  3134. "parent_id": 15938,
  3135. "context_path": "/root/呈现/视觉/形象塑造/人物表现/动作姿态/表演性动作"
  3136. },
  3137. "source_nodes": [
  3138. "夸张表演"
  3139. ],
  3140. "source_posts": [
  3141. "66619827000000000600486f",
  3142. "6752d19b000000000202b816",
  3143. "68d76cd100000000120165e4"
  3144. ],
  3145. "matched_capabilities": [
  3146. "CAP-001",
  3147. "CAP-003",
  3148. "CAP-002",
  3149. "CAP-014"
  3150. ],
  3151. "capability_combination": "CAP-003(图像主体一致性保持)确保同一人物在多格中外观一致;CAP-001(文本到图像生成)根据每格的场景/情绪描述生成对应内容;CAP-002(结构/姿态控制生成)控制每格中人物的夸张肢体动作和姿态;CAP-014(图像内文字渲染)在每格图像中嵌入幽默文字标注;但多格拼贴的版式排布(将多张图拼合为一张网格图)在原子能力表中无明确对应能力",
  3152. "match_status": "需要调研",
  3153. "needs_research": true,
  3154. "research_note": "现有能力可以:用CAP-003保持人物一致性、用CAP-001生成各格内容、用CAP-002控制夸张姿态、用CAP-014添加文字标注。缺少的关键能力是:将多张独立生成的图像自动排版合并为多格拼贴网格图(如2x3、3x3等宫格布局)的能力,原子能力表中无任何工具明确支持多图拼贴版式合成输出。需要调研:是否有AI工具原生支持多格拼贴图一次性生成(如Midjourney的图像网格输出是否可定制为内容差异化的多格)、或是否有图像拼贴合成节点(如ComfyUI中的图像拼接节点)可实现此功能。"
  3155. },
  3156. {
  3157. "requirement_id": "REQ_071",
  3158. "requirement_text": "将动物(如猫咪)与各种食物、道具进行创意合成,给动物添加配饰(帽子、假发、领带等)并嵌入食物场景中,搭配谐音梗或双关文字,制作出拟人化角色扮演的趣味表情包图片",
  3159. "source_subtree": {
  3160. "parent_node": "表演性动作",
  3161. "parent_id": 15938,
  3162. "context_path": "/root/呈现/视觉/形象塑造/人物表现/动作姿态/表演性动作"
  3163. },
  3164. "source_nodes": [
  3165. "角色演绎",
  3166. "夸张表演"
  3167. ],
  3168. "source_posts": [
  3169. "66619827000000000600486f",
  3170. "6752d19b000000000202b816",
  3171. "68d76cd100000000120165e4"
  3172. ],
  3173. "matched_capabilities": [
  3174. "CAP-001",
  3175. "CAP-012",
  3176. "CAP-014",
  3177. "CAP-003"
  3178. ],
  3179. "capability_combination": "CAP-001(文本到图像生成)可直接通过提示词描述动物+配饰+食物场景的组合画面;CAP-012(图像局部重绘)可在已有动物图像上局部添加帽子、假发、领带等配饰元素,或将动物嵌入食物场景;CAP-003(图像主体一致性保持)可在多张表情包中保持同一只猫咪的外观特征一致;CAP-014(图像内文字渲染)可在图像中嵌入谐音梗或双关文字",
  3180. "match_status": "完全满足",
  3181. "needs_research": false,
  3182. "research_note": ""
  3183. }
  3184. ],
  3185. "metadata": {
  3186. "last_updated": "2026-04-02T20:41:20.543512",
  3187. "total_requirements": 99,
  3188. "fully_matched": 44,
  3189. "needs_research": 55
  3190. }
  3191. }