{
  "id": "a92af27a-0106-4c6f-9d1c-f9783b652f44",
  "revision": 0,
  "last_node_id": 7,
  "last_link_id": 5,
  "nodes": [
    {
      "id": 1,
      "type": "SenseNovaU1LocalLoader",
      "pos": [
        -586.4999290408795,
        148.5000079099019
      ],
      "size": [
        500.234375,
        390.625
      ],
      "flags": {},
      "order": 0,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "u1_model",
          "type": "SENSENOVA_U1_LOCAL_MODEL",
          "links": [
            1
          ]
        },
        {
          "name": "model_info_json",
          "type": "STRING",
          "links": null
        }
      ],
      "properties": {
        "Node name for S&R": "SenseNovaU1LocalLoader"
      },
      "widgets_values": [
        "sensenova/SenseNova-U1-8B-MoT-Infographic",
        "",
        "cuda",
        "bfloat16",
        "auto",
        "none",
        "",
        "full",
        ""
      ]
    },
    {
      "id": 2,
      "type": "SenseNovaU1LocalTextToImage",
      "pos": [
        -19.2498760630192,
        149.75002977542277
      ],
      "size": [
        565.953125,
        887.203125
      ],
      "flags": {},
      "order": 3,
      "mode": 0,
      "inputs": [
        {
          "name": "u1_model",
          "type": "SENSENOVA_U1_LOCAL_MODEL",
          "link": 1
        },
        {
          "name": "prompt",
          "type": "STRING",
          "widget": {
            "name": "prompt"
          },
          "link": 5
        }
      ],
      "outputs": [
        {
          "name": "images",
          "type": "IMAGE",
          "links": [
            2
          ]
        },
        {
          "name": "text",
          "type": "STRING",
          "links": null
        },
        {
          "name": "think_text",
          "type": "STRING",
          "links": [
            3
          ]
        },
        {
          "name": "metadata_json",
          "type": "STRING",
          "links": null
        }
      ],
      "properties": {
        "Node name for S&R": "SenseNovaU1LocalTextToImage"
      },
      "widgets_values": [
        "这张信息图的标题是“SenseNova-U1”,采用现代极简科技矩阵风格。整体布局为水平三列网格结构,背景是带有极浅银灰色细密点阵的哑光纯白高级纸张纹理,画面长宽比为16:9。\n\n排版采用严谨的视觉层级:主标题使用粗体无衬线黑体字,正文使用清晰的现代等宽字体。配色方案极其克制,以纯白色为底,深炭黑为主视觉文字和边框,浅石板灰用于背景色块和次要信息区分,图标采用精致的银灰色线框绘制。\n\n在画面正上方居中位置,使用醒目的深炭黑粗体字排布着大标题“SenseNova-U1”。标题正下方是浅石板灰色的等宽字体副标题“新一代端到端统一多模态大模型家族”。\n\n画面主体分为左、中、右三个相等的垂直信息区块,区块之间通过充足的负空间进行物理隔离。\n\n左侧区块的主题是概述。顶部有一个银灰色线框绘制的、由放大镜和齿轮交织的图标,旁边是粗体小标题“Overview”。该区块内从上到下垂直排列着三个要点:第一个要点旁边是一个代表文档与照片重叠的极简图标,紧跟着文字“多模态模型家族,统一文本/图像理解和生成”。向下是由两个相连的同心圆组成的架构图标,配有文字“基于NEO-Unify架构(端到端统一理解和生成)”。最下方是一个带有斜线划掉的眼睛和漏斗形状的图标,明确指示文本“无需视觉编码器(VE)和变分自编码器(VAE)”。\n\n中间区块展示模型矩阵。顶部是一个包含两个分支节点的树状网络图标,旁边是粗体小标题“两个模型规格”。区块内分为上下两个包裹在浅石板灰色极细边框内的卡片。上方的卡片内画着一个代表高密度的实心几何立方体图标,大字标注“SenseNova-U1-8B-MoT”,下方是等宽字体说明“8B MoT 密集主干模型”。下方的卡片内画着一个带有闪电符号的网状发光大脑图标,大字标注“SenseNova-U1-A3B-MoT”,下方是等宽字体说明“A3B MoT 混合专家(MoE)主干模型”。在这两个独立卡片的正下方,左侧放置一个笑脸轮廓图标搭配文字“将在HF等平台公开”,右侧放置一个带有折角的书面报告图标搭配文字“将发布技术报告”。\n\n右侧区块呈现核心优势。顶部是一个代表巅峰的上升阶梯折线图图标,旁边是粗体小标题“Highlights”。该区块内部垂直分布着四个带有浅石板灰底色的长方形色块,每个色块内部左侧对应一个具体的图标,右侧为文字。第一个色块内是一个无缝相连的莫比乌斯环图标,配文“原生统一架构,无VE和VAE”。第二个色块内是一个顶端带有星星的奖杯图标,配文“单一统一模型在理解和生成任务上均达到SOTA性能”。第三个色块内是代表文本行与拍立得照片交替穿插的图标,配文“强大的原生交错推理能力(模型原生生成图像进行推理)”。最后一个色块内是一个被切分出一小块的硬币与详细饼状图结合的图标,配文“能生成复杂信息图表,性价比出色”。",
        "2720x1536|16:9",
        4,
        "none",
        3,
        0,
        1,
        50,
        1,
        42,
        false,
        false
      ]
    },
    {
      "id": 3,
      "type": "PreviewImage",
      "pos": [
        612.0374341866545,
        153.07410621275454
      ],
      "size": [
        614.578125,
        393.609375
      ],
      "flags": {},
      "order": 4,
      "mode": 0,
      "inputs": [
        {
          "name": "images",
          "type": "IMAGE",
          "link": 2
        }
      ],
      "outputs": [],
      "properties": {
        "Node name for S&R": "PreviewImage"
      },
      "widgets_values": []
    },
    {
      "id": 4,
      "type": "PreviewAny",
      "pos": [
        614.1411713052378,
        610.8904862658945
      ],
      "size": [
        606.28125,
        415.96875
      ],
      "flags": {},
      "order": 5,
      "mode": 0,
      "inputs": [
        {
          "name": "source",
          "type": "*",
          "link": 3
        }
      ],
      "outputs": [],
      "properties": {
        "Node name for S&R": "PreviewAny"
      },
      "widgets_values": [
        null,
        null,
        null
      ]
    },
    {
      "id": 6,
      "type": "Note",
      "pos": [
        -874.1990665007161,
        624.8566777241045
      ],
      "size": [
        238.546875,
        133.046875
      ],
      "flags": {},
      "order": 1,
      "mode": 0,
      "inputs": [],
      "outputs": [],
      "properties": {},
      "widgets_values": [
        "This is a prompt enhancement module; you can turn it off if you don't need it."
      ],
      "color": "#432",
      "bgcolor": "#653"
    },
    {
      "id": 7,
      "type": "SenseNovaPromptBuilder",
      "pos": [
        -585.0759757790407,
        605.0166969060281
      ],
      "size": [
        504.09375,
        412.65625
      ],
      "flags": {},
      "order": 2,
      "mode": 0,
      "inputs": [],
      "outputs": [
        {
          "name": "prompt",
          "type": "STRING",
          "links": null
        },
        {
          "name": "usage_json",
          "type": "STRING",
          "links": [
            5
          ]
        },
        {
          "name": "raw_json",
          "type": "STRING",
          "links": null
        }
      ],
      "properties": {
        "Node name for S&R": "SenseNovaPromptBuilder"
      },
      "widgets_values": [
        "生成一张教育预防电信诈骗的信息图",
        "You are a world-renowned \"Senior Visual Information Architect\" and \"AI Image Prompt Engineering Expert.\" You specialize in transforming fragmented or chaotic [Raw Information] into highly structured, professional Infographic Generation Prompts. Your work is defined by rigorous visual logic, precise spatial organization, and a high density of useful information.\n\n# Task\nReconstruct the user’s [Raw Information] into a comprehensive visual synthesis prompt (approx. 400-600 words). Your objective is to guide large image models (e.g., Gemini, Midjourney, DALL-E 3) to render an information-dense infographic featuring advanced typography, a vivid visual style, and perfect structural clarity based solely on your textual description.\n\n# Step-by-Step Methodology\n1. **Content Expansion & Textualization**: Analyze the [Raw Information] to extract its core intent.\n    - Detailing: Extract every entity, number, color, and phrase from the [Raw Information]. Do not summarize.\n    - Categorization: Define sub-categories with distinct visual markers.\n    - Density Enrichment: If the input is brief, supplement it with professional annotations, sub-headings, body text and \"Pro-tips\" or \"Key Insights\" related to the topic to maximize the \"information load\".\n2. **Adaptive Structural Analysis**:\n    - User-Defined Priority: First, check if the user has provided specific layout instructions (e.g., \"three-column grid,\" \"horizontal timeline\"). If present, strictly follow these instructions.\n    - Logic-Driven Inference: If no layout is specified, analyze the [Raw Information] for its underlying logic (chronological, hierarchical, process-oriented, or comparative) and design a spatial architecture that best serves that logic.\n3. **Style Tonal Setting**: If no specific style is provided, assign a unique aesthetic that complements the content (e.g., French hand-drawn collage, modern minimalist matrix, or industrial technical blueprint).\n4. **Data Preservation & Encoding**: Ensure all numbers, dates, and proper nouns are 100% preserved. Convert these into explicit visual labels, charts, or callouts within the prompt. Detect the language of the [Raw Information] and use it for 100% of the output. If input is Chinese, output Chinese. If input is English, output English. No mixing.\n\n\n# Strict Constraints\n1. **Strict Language Parity**: Maintain absolute language consistency. If the [Raw Information] is in Chinese, the entire output must be in Chinese; if in English, the output must be in English. No code-switching.\n2. **Fidelity to [Raw Information]**: You are prohibited from omitting any proper nouns, dates, colors, or specific values provided in the input.\n3. **The \"Zero Nonsense\" Rule**: STRICTLY FORBIDDEN to include introductory, summary, or meta-commentary text (e.g., \"Here is the refined prompt...\"). Do not explain design choices or justify element omissions (e.g., do not mention \"implied flow\"). Start the response immediately with the visual description.\n4. **Visual Precision**:\n    - Textures: Mandatorily describe background textures (e.g., off-white aged paper, light gray grid, or black halftone shadows).\n    - Typography: Explicitly specify font styles for different hierarchies (e.g., bold serif for titles, condensed mono-space for technical data).\n5. **Text Rendering Protocol**:\n    - Quotes for Content: Every piece of text intended to appear in the image MUST be enclosed in quotes.\n    - No Quotes for Style: NEVER use quotation marks for descriptions of [Style Description], [Layout Structure], colors or any non-textual elements.\n6. **Relational Arrow Logic**: Minimize the use of arrows. Rely on spatial proximity or alignment to imply connectivity. If arrows are requested, avoid generic orientations like \"horizontal.\" Instead, specify their precise starting point and target destination.\n7. **Semantic Icon Correspondence (CRITICAL)**: You must specifically describe the visual content of every icon to ensure it matches the quoted text. (e.g., \"Next to the text 'Apple' is a detailed illustration of a red delicious apple with a green leaf.\") Do not use generic terms like \"an icon\" or \"a graphic\" without specifying what it is.\n8. **No Hexadecimal Codes**: Never use codes like #xxxx. Use descriptive color names (e.g., sage green, deep navy blue, terracotta).\n\n# Output Format (If the [Raw Information] is in Chinese, please translate the following content into Chinese. If the [Raw Information] is in English, please keep the following content in English.)\nThe theme of the infographic is [Subject Name] (or 此信息图的主题是: [Subject Name]), [Style Description]. The overall layout is [Layout Structure], with a background of [Background Details].\nProvide a smooth and fluent description of the prompts for generating professional infographics. The title is: \"Subject Name\",  [Description of elements or icons in the infographic], [Position], and embed the text information within it, enclosed in quotes.\n\n---\nPlease receive the user's [Raw Information] and directly output the restructured professional image generation prompt:",
        "sensenova-6.7-flash-lite",
        0.3,
        1,
        4096,
        120
      ]
    }
  ],
  "links": [
    [
      1,
      1,
      0,
      2,
      0,
      "SENSENOVA_U1_LOCAL_MODEL"
    ],
    [
      2,
      2,
      0,
      3,
      0,
      "IMAGE"
    ],
    [
      3,
      2,
      2,
      4,
      0,
      "STRING"
    ],
    [
      5,
      7,
      1,
      2,
      1,
      "STRING"
    ]
  ],
  "groups": [],
  "config": {},
  "extra": {
    "workflowRendererVersion": "Vue",
    "ds": {
      "scale": 0.6412973759090729,
      "offset": [
        1055.6855096974812,
        19.214707810300403
      ]
    },
    "frontendVersion": "1.39.19",
    "VHS_latentpreview": false,
    "VHS_latentpreviewrate": 0,
    "VHS_MetadataImage": true,
    "VHS_KeepIntermediate": true
  },
  "version": 0.4
}