File size: 30,651 Bytes
7c08dc3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
# convert.py / build_poster.py  (patched)
# -*- coding: utf-8 -*-
import json, re, pathlib, shutil, os, math

IMAGES_DIR_NAME = "<4o_4o>_images_and_tables"

def find_project_root(start: pathlib.Path) -> pathlib.Path:
    cur = start.resolve()
    for p in [cur] + list(cur.parents):
        if (p / "Paper2Poster").exists() or (p / IMAGES_DIR_NAME).exists() or (p / "test" / "cambridge_template.tex").exists():
            return p
    return cur

SCRIPT_DIR = pathlib.Path(__file__).resolve().parent
ROOT_DIR   = find_project_root(SCRIPT_DIR)
TEST_DIR   = ROOT_DIR / "test"

JSON_PATH        = TEST_DIR / "poster_content.json"
TEMPLATE_PATH    = TEST_DIR / "cambridge_template.tex"
ARRANGEMENT_PATH = TEST_DIR / "arrangement.json"
CAPTION_PATH     = TEST_DIR / "figure_caption.json"

OUTPUT_DIR       = TEST_DIR / "latex_proj"
OUTPUT_PATH      = OUTPUT_DIR / "poster_output_fix.tex"

IMAGES_PARENTS   = [ROOT_DIR / "Paper2Poster", ROOT_DIR]

# ---------- 版式与字号 ----------
BEAMER_SCALE_TARGET   = 1.15
TITLE_SIZE_SINGLE     = r"\Huge"
TITLE_SIZE_WRAP1      = r"\huge"
TITLE_SIZE_WRAP2PLUS  = r"\LARGE"
AUTHOR_SIZE_CMD       = r"\Large"
INSTITUTE_SIZE_CMD    = r"\large"
BLOCK_TITLE_SIZE_CMD  = r"\Large"
BLOCK_BODY_SIZE_CMD   = r"\large"
CAPTION_SIZE_CMD      = r"\normalsize"

BAPOSTER_FONTSCALE_TARGET = 0.31
TITLE_EM_HEIGHT = "6em"
RIGHT_LOGO_FILENAME = "logo.png"

FIG_ENLARGE_FACTOR    = 1.18
FIG_MIN_FRAC          = 0.60
FIG_MAX_FRAC          = 0.98
BASE_FIG_RATIO_LIMIT  = 0.58
TEXT_CHAR_PER_LINE    = 95
LINE_HEIGHT_WEIGHT    = 0.015

RIGHT_LOGO_INNERSEP_CM= 2.0
RIGHT_LOGO_XSHIFT_CM  = -2.0
RIGHT_LOGO_YSHIFT_CM  = 0.0
RIGHT_LOGO_HEIGHT_CM  = 6.0

# ### NEW: beamer 自适应列宽参数(不使用 span=2)
SEP_FRAC_DEFAULT      = 0.02   # 每个分隔列宽占 paperwidth 的比例
LONG_TITLE_THRESHOLD  = 38     # 标题长度阈值,触发加宽该列
W_HEAVY_BOOST         = 0.50   # 最重列的权重增量(默认三列基准权重=1)
COL_FRAC_MIN          = 0.26   # 单列最小占比(经验安全值)
COL_FRAC_MAX          = 0.42   # 单列最大占比(经验安全值)

def escape_text(s: str) -> str:
    if not s: return ""
    rep = {"&": r"\&", "%": r"\%", "$": r"\$", "#": r"\#", "_": r"\_",
           "{": r"\{", "}": r"\}", "~": r"\textasciitilde{}", "^": r"\textasciicircum{}"}
    for k, v in rep.items(): s = s.replace(k, v)
    return s

def soft_wrap_title_for_logo(title: str, first_limit=68, next_limit=72) -> str:
    if not title or len(title) <= first_limit: return title
    def break_at(s: str, limit: int):
        for sep in [": ", " - ", " — ", " – "]:
            idx = s.rfind(sep, 0, limit+1)
            if idx != -1: return s[:idx+len(sep)].rstrip(), s[idx+len(sep):].lstrip()
        idx = s.rfind(" ", 0, limit+1)
        if idx == -1: idx = limit
        return s[:idx].rstrip(), s[idx:].lstrip()
    head, rest = break_at(title, first_limit); parts = [head]
    if rest:
        if len(rest) > next_limit:
            mid, tail = break_at(rest, next_limit); parts.append(mid)
            if tail: parts.append(tail)
        else: parts.append(rest)
    return r" \\ ".join(parts)

def replace_command_balanced(tex: str, cmd: str, new_line: str) -> str:
    m = re.search(rf"\\{cmd}\b", tex)
    if not m: return tex
    i = m.end()
    if i < len(tex) and tex[i] == '[':
        depth = 1; i += 1
        while i < len(tex) and depth:
            if tex[i] == '[': depth += 1
            elif tex[i] == ']': depth -= 1
            i += 1
        while i < len(tex) and tex[i].isspace(): i += 1
    if i >= len(tex) or tex[i] != '{': return tex
    start = m.start(); j = i; depth = 0; end = None
    while j < len(tex):
        if tex[j] == '{': depth += 1
        elif tex[j] == '}':
            depth -= 1
            if depth == 0: end = j; break
        j += 1
    if end is None: return tex
    return tex[:start] + new_line + tex[end+1:]

def detect_template(tex: str) -> str:
    if re.search(r"\\documentclass[^}]*\{baposter\}", tex): return "baposter"
    return "beamer"

def norm_title(s: str) -> str:
    return " ".join((s or "").lower().replace("&", "and").split())

def slug_name(s: str) -> str:
    base = re.sub(r"[^a-z0-9]+", "", norm_title(s))
    return base or "s"

CAP_PREFIX_RE = re.compile(
    r'^\s*(?:figure|fig\.?)\s*\d+(?:\s*[a-z]\)|\s*[a-z])?\s*[::\.\-–—]\s*', re.IGNORECASE
)
def clean_caption_prefix(cap: str) -> str:
    if not cap: return ""
    return CAP_PREFIX_RE.sub("", cap).strip()

# ---------- beamer ----------
def choose_title_size_cmd(wrapped_title: str) -> str:
    br = wrapped_title.count("\\\\")
    return TITLE_SIZE_SINGLE if br==0 else (TITLE_SIZE_WRAP1 if br==1 else TITLE_SIZE_WRAP2PLUS)

def find_env_bounds(tex: str, env: str, start_pos: int):
    pat = re.compile(rf"\\(begin|end)\{{{re.escape(env)}\}}")
    depth = 0; begin_idx = None
    for m in pat.finditer(tex, start_pos):
        if m.group(1) == "begin":
            if depth == 0: begin_idx = m.start()
            depth += 1
        else:
            depth -= 1
            if depth == 0:
                return begin_idx, m.end()
    return None, None

def extract_begin_token_with_options(region: str, env: str) -> str:
    m = re.match(rf"(\\begin\{{{re.escape(env)}\}}\s*(?:\[[^\]]*\])?)", region, re.S)
    return m.group(1) if m else f"\\begin{{{env}}}"

def split_even_continuous(items: list, n_cols: int) -> list[list]:
    n = len(items); base = n // n_cols; rem = n % n_cols
    out=[]; idx=0
    for i in range(n_cols):
        take = base + (1 if i < rem else 0)
        out.append(items[idx:idx+take]); idx += take
    return out

def bump_beamerposter_scale(tex: str, target: float) -> str:
    def repl(m):
        opts = m.group(1)
        opts2 = re.sub(r"scale\s*=\s*[\d.]+", "", opts)
        opts2 = re.sub(r",,", ",", opts2).strip().strip(",")
        opts2 = (opts2 + "," if opts2 else "") + f"scale={target}"
        return f"\\usepackage[{opts2}]{{beamerposter}}"
    return re.sub(r"\\usepackage\[(.*?)\]\{beamerposter\}", repl, tex, flags=re.S)

def inject_font_tweaks_beamer(tex: str, title_size_cmd: str) -> str:
    tweaks = (
        "\n% --- injected font tweaks (beamer) ---\n"
        f"\\setbeamerfont{{title}}{{size={title_size_cmd}}}\n"
        f"\\setbeamerfont{{author}}{{size={AUTHOR_SIZE_CMD}}}\n"
        f"\\setbeamerfont{{institute}}{{size={INSTITUTE_SIZE_CMD}}}\n"
        f"\\setbeamerfont{{block title}}{{size={BLOCK_TITLE_SIZE_CMD}}}\n"
        f"\\setbeamerfont{{block body}}{{size={BLOCK_BODY_SIZE_CMD}}}\n"
        f"\\setbeamerfont{{caption}}{{size={CAPTION_SIZE_CMD}}}\n"
        "\\setlength{\\abovecaptionskip}{4pt}\n"
        "\\setlength{\\belowcaptionskip}{3pt}\n"
    )
    pos = tex.find(r"\begin{document}")
    return tex[:pos] + tweaks + tex[pos:] if pos!=-1 else tex + tweaks

def inject_right_logo_beamer(tex: str) -> str:
    if "logo.png" in tex: return tex
    pos_head = tex.find(r"\addtobeamertemplate{headline}")
    node = (
        f"\n      \\node[anchor=north east, inner sep={RIGHT_LOGO_INNERSEP_CM}cm]"
        f" at ([xshift={RIGHT_LOGO_XSHIFT_CM}cm,yshift={RIGHT_LOGO_YSHIFT_CM}cm]current page.north east)\n"
        f"      {{\\includegraphics[height={RIGHT_LOGO_HEIGHT_CM}cm]{{logo.png}}}};\n"
    )
    if pos_head != -1:
        b,e = find_env_bounds(tex, "tikzpicture", tex.find(r"\begin{tikzpicture}", pos_head))
        if b is not None:
            return tex[:e-len(r"\end{tikzpicture}")] + node + tex[e:]
    add = (
        "\n% --- injected right-top logo (beamer) ---\n"
        "\\addtobeamertemplate{headline}{}\n"
        "{\n"
        "  \\begin{tikzpicture}[remember picture,overlay]\n"
        f"    \\node[anchor=north east, inner sep={RIGHT_LOGO_INNERSEP_CM}cm]"
        f" at ([xshift={RIGHT_LOGO_XSHIFT_CM}cm,yshift={RIGHT_LOGO_YSHIFT_CM}cm]current page.north east)\n"
        f"    {{\\includegraphics[height={RIGHT_LOGO_HEIGHT_CM}cm]{{logo.png}}}};\n"
        "  \\end{tikzpicture}\n"
        "}\n"
    )
    pos = tex.find(r"\begin{document}")
    return tex[:pos] + add + tex[pos:] if pos!=-1 else tex + add

# ### NEW: beamer 注入列宽宏(显式长度,避免偏左/右侧空白)
def inject_beamer_column_widths(tex: str, col_fracs, sep_frac: float) -> str:
    """
    col_fracs: [fA, fB, fC],三列在 paperwidth 上的占比(不含 4 个分隔列)。
    sep_frac:  每个分隔列在 paperwidth 上的占比。
    """
    assert len(col_fracs) == 3
    # 这里直接设定长度为某个 \paperwidth 的比例,避免依赖模板里的 \colwidth / \separatorcolumn
    snippet = (
        "\n% --- injected beamer fixed column widths (auto) ---\n"
        "\\makeatletter\n"
        "\\newlength\\sepwidth\n"
        f"\\setlength\\sepwidth{{{sep_frac:.6f}\\paperwidth}}\n"
        "\\newlength\\colAwidth\\newlength\\colBwidth\\newlength\\colCwidth\n"
        f"\\setlength\\colAwidth{{{col_fracs[0]:.6f}\\paperwidth}}\n"
        f"\\setlength\\colBwidth{{{col_fracs[1]:.6f}\\paperwidth}}\n"
        f"\\setlength\\colCwidth{{{col_fracs[2]:.6f}\\paperwidth}}\n"
        "\\makeatother\n"
    )
    pos = tex.find(r"\begin{document}")
    return tex[:pos] + snippet + tex[pos:] if pos!=-1 else tex + snippet

# ---------- baposter ----------
def bump_baposter_fontscale(tex: str, target: float) -> str:
    def repl(m):
        opt = m.group(1)
        opt2 = re.sub(r"fontscale\s*=\s*[\d.]+", "", opt)
        opt2 = re.sub(r",,", ",", opt2).strip().strip(",")
        opt2 = (opt2 + "," if opt2 else "") + f"fontscale={target}"
        return f"\\documentclass[{opt2}]{{baposter}}"
    return re.sub(r"\\documentclass\[(.*?)\]\{baposter\}", repl, tex, flags=re.S)

def parse_brace_group(tex: str, start: int) -> tuple[int,int]:
    assert tex[start] == '{'
    depth = 0
    for i in range(start, len(tex)):
        if tex[i] == '{': depth += 1
        elif tex[i] == '}':
            depth -= 1
            if depth == 0: return start, i
    return start, start

def set_poster_option(tex: str, key: str, value: str) -> str:
    """在 \begin{poster}{...} 的第一个大括号里插入/替换 key=value。"""
    groups, _ = get_poster_args_ranges(tex)
    if not groups:
        return tex
    s, e = groups[0]  # 第1个 {} 就是 poster 的 options
    opts = tex[s+1:e]
    # 已有就替换;没有就附加
    pat = re.compile(rf'(?<!\w){re.escape(key)}\s*=\s*[^,}}]+')
    if pat.search(opts):
        opts2 = pat.sub(f"{key}={value}", opts)
    else:
        opts_stripped = opts.strip()
        sep = "" if not opts_stripped else ("," if opts_stripped.rstrip().endswith(",") else ",")
        opts2 = opts_stripped + f"{sep}\n{key}={value}"
    return tex[:s+1] + opts2 + tex[e:]

def enforce_baposter_three_columns(tex: str) -> str:
    """强制3列,并调小列间距以铺满页面宽度。"""
    tex = set_poster_option(tex, "columns", "3")
    tex = set_poster_option(tex, "colspacing", "0.6em")  # ← 从 1em 收紧到 0.6em
    return tex

def bump_baposter_margin(tex: str, margin_len: str = "7mm") -> str:
    """
    在 \documentclass[...,margin=<len>]{baposter} 里设置(或替换) margin=<len>。
    """
    def repl(m):
        opts = m.group(1)
        # 删除已有 margin=...
        opts2 = re.sub(r"(?<!\w)margin\s*=\s*[^,\]]+", "", opts)
        # 清理多余逗号
        opts2 = re.sub(r",,", ",", opts2).strip().strip(",")
        # 附加新的 margin
        opts2 = (opts2 + "," if opts2 else "") + f"margin={margin_len}"
        return f"\\documentclass[{opts2}]{{baposter}}"
    return re.sub(r"\\documentclass\[(.*?)\]\{baposter\}", repl, tex, flags=re.S)

def _soft_wrap_box_title(title: str, first_limit=28, next_limit=32) -> str:
    """
    把很长的 headerbox 标题按词边界软换行,返回带 '\\\\' 的字符串。
    """
    t = (title or "").strip()
    if len(t) <= first_limit:
        return t
    def break_at(s, limit):
        for sep in [": ", " - ", " — ", " – ", "· ", " "]:
            idx = s.rfind(sep, 0, limit+1)
            if idx != -1:
                return s[:idx+len(sep)].rstrip(), s[idx+len(sep):].lstrip()
        return s[:limit].rstrip(), s[limit:].lstrip()
    head, rest = break_at(t, first_limit)
    parts = [head]
    if rest:
        if len(rest) > next_limit:
            mid, tail = break_at(rest, next_limit); parts.append(mid)
            if tail: parts.append(tail)
        else:
            parts.append(rest)
    return r" \\ ".join(parts)

def get_poster_args_ranges(tex: str):
    m = re.search(r"\\begin\{poster\}", tex)
    if not m: return None, None
    i = m.end()
    while i < len(tex) and tex[i].isspace(): i += 1
    groups=[]
    for _ in range(5):
        while i < len(tex) and tex[i] != '{': i += 1
        if i>=len(tex): break
        s,e = parse_brace_group(tex, i); groups.append((s,e)); i = e+1
    if len(groups) < 5: return None, None
    insert_after = groups[-1][1] + 1
    return groups, insert_after

def rewrite_baposter_header(tex: str, title_wrapped: str, authors: str, affiliations: str) -> str:
    groups, _ = get_poster_args_ranges(tex)
    if not groups: return tex
    g3s,g3e = groups[2]
    g4s,g4e = groups[3]
    g5s,g5e = groups[4]
    br = title_wrapped.count("\\\\")
    tsize = "\\Huge " if br==0 else ("\\huge " if br==1 else "\\LARGE ")
    new_title_arg = "{\\bfseries " + tsize + "\\textsc{" + escape_text(title_wrapped) + "}" + "}"
    authors_affil = "\\textsc{" + escape_text(authors) + "}"
    if (affiliations or "").strip():
        authors_affil += r"\\ " + "\\textsc{" + escape_text(affiliations) + "}"
    new_authors_arg = "{" + authors_affil + "}"
    right_logo_path = OUTPUT_DIR / RIGHT_LOGO_FILENAME
    if right_logo_path.exists():
        new_right_arg = "{\\includegraphics[height=" + TITLE_EM_HEIGHT + "]{" + RIGHT_LOGO_FILENAME + "}}"
    else:
        new_right_arg = tex[g5s:g5e+1]
    new_tex = tex[:g3s] + new_title_arg + tex[g3e+1:g4s] + new_authors_arg + tex[g4e+1:g5s] + new_right_arg + tex[g5e+1:]
    return new_tex

def wipe_poster_body_and_insert(tex: str, body: str) -> str:
    groups, insert_after = get_poster_args_ranges(tex)
    if not groups: return tex
    pend = tex.find(r"\end{poster}", insert_after)
    if pend == -1: pend = len(tex)
    return tex[:insert_after] + "\n" + body + "\n" + tex[pend:]

def headerbox_text(title: str, name: str, opts: str, body: str) -> str:
    # 标题软换行 + 正确转义(逐行转义,保留换行符)
    wrapped = _soft_wrap_box_title(title)
    safe = " \\\\ ".join(escape_text(p) for p in wrapped.split(r" \\ "))
    return f"\\headerbox{{{safe}}}{{name={name},{opts}}}{{\n{body}\n}}\n\n"

# ---------- 内容 ----------
def format_content_to_latex(content: str) -> str:
    if not content: return ""
    lines = [ln.strip() for ln in content.splitlines() if ln.strip()]
    if lines and all(ln.startswith(("-", "•")) for ln in lines):
        items = [escape_text(ln.lstrip("-• ").strip()) for ln in lines]
        return "\n".join(["\\begin{itemize}", "\\setlength{\\itemsep}{2pt}", "\\setlength{\\parsep}{0pt}"]
                         + [f"\\item {it}" for it in items] + ["\\end{itemize}"])
    return escape_text(" ".join(lines))

def build_header_from_meta(meta: dict):
    raw_title = meta.get('poster_title','') or ''
    wrapped_title = soft_wrap_title_for_logo(raw_title)
    a = meta.get('authors','') or ''
    inst = meta.get('affiliations','') or ''
    return wrapped_title, a, inst

# ---------- arrangement / captions / images ----------
def load_arrangement_and_captions():
    arr = json.loads(ARRANGEMENT_PATH.read_text(encoding="utf-8"))
    panels = arr.get("panel_arrangement", [])
    figures = arr.get("figure_arrangement", [])
    panels_by_id = {p["panel_id"]: p for p in panels if "panel_id" in p}
    cap_full, cap_base = {}, {}
    if CAPTION_PATH.exists():
        caps = json.loads(CAPTION_PATH.read_text(encoding="utf-8"))
        if isinstance(caps, dict):
            for _, v in caps.items():
                imgp = v.get("image_path", ""); cap = v.get("caption", "")
                if imgp:
                    cap_full[imgp] = cap
                    cap_base[os.path.basename(imgp)] = cap
    return panels_by_id, figures, cap_full, cap_base

def resolve_images_parent_dir(sample_paths):
    for parent in IMAGES_PARENTS:
        for sp in sample_paths[:10]:
            if sp:
                p = parent / sp
                if p.exists():
                    return parent
    return IMAGES_PARENTS[0]

def _fallback_search_by_basename(images_parent: pathlib.Path, basename: str) -> pathlib.Path | None:
    # 有限度搜索:只在 <parent>/<4o_4o>_images_and_tables/** 下找第一个同名文件
    root = images_parent / IMAGES_DIR_NAME
    if not root.exists(): return None
    try:
        for p in root.rglob(basename):
            if p.is_file(): return p
    except Exception:
        pass
    return None

def copy_and_get_relpath(figure_path: str, out_tex_path: pathlib.Path, images_parent: pathlib.Path) -> str:
    fig_dir = out_tex_path.parent / "figures"
    fig_dir.mkdir(parents=True, exist_ok=True)
    p = pathlib.Path(figure_path)
    if p.is_absolute():
        src = p
    else:
        if p.parts and p.parts[0] == IMAGES_DIR_NAME:
            src = images_parent / p
        else:
            src = images_parent / IMAGES_DIR_NAME / p
    if not src.exists():
        # 兜底:按 basename 搜索一次
        fb = _fallback_search_by_basename(images_parent, p.name)
        if fb is not None:
            src = fb
    dst = fig_dir / src.name
    try:
        if src.exists() and ((not dst.exists()) or src.stat().st_mtime > dst.stat().st_mtime):
            shutil.copy2(src, dst)
    except Exception:
        pass
    return str(pathlib.Path("figures") / dst.name).replace(os.sep, "/")

def build_figures_for_sections(sections, panels_by_id, figures, cap_full, cap_base):
    sec_name_to_idx = {norm_title(sec.get("title","")): i
                       for i, sec in enumerate(sections)
                       if norm_title(sec.get("title","")) != norm_title("Poster Title & Author")}
    panelid_to_secidx = {}
    for p in panels_by_id.values():
        pname = norm_title(p.get("panel_name",""))
        if pname in sec_name_to_idx:
            panelid_to_secidx[p["panel_id"]] = sec_name_to_idx[pname]
    sec_panel_height = {}; sec_arranged_fig_height = {}
    for pid, p in panels_by_id.items():
        if pid in panelid_to_secidx:
            sidx = panelid_to_secidx[pid]
            sec_panel_height[sidx] = float(p.get("height", 0.0) or 0.0)
            sec_arranged_fig_height[sidx] = 0.0
    sec_figs = {i: [] for i in range(len(sections))}
    for fg in figures:
        pid = fg.get("panel_id")
        if pid not in panelid_to_secidx: continue
        sidx = panelid_to_secidx[pid]
        pinfo = panels_by_id.get(pid, {})
        p_w = float(pinfo.get("width", 1.0) or 1.0)
        f_w = float(fg.get("width", 0.0) or 0.0)
        frac = 0.0 if p_w <= 0 else (f_w / p_w) * 0.95
        width_frac = max(FIG_MIN_FRAC, min(FIG_MAX_FRAC, (frac if frac>0 else 0.6)*FIG_ENLARGE_FACTOR))
        fpath = fg.get("figure_path", "")
        cap_raw = cap_full.get(fpath) or cap_base.get(os.path.basename(fpath)) or ""
        cap = clean_caption_prefix(cap_raw)
        sec_figs[sidx].append({
            "src": fpath, "caption": cap,
            "width_frac": width_frac,
            "order_y": float(fg.get("y", 0.0) or 0.0),
            "arranged_height": float(fg.get("height", 0.0) or 0.0)
        })
        sec_arranged_fig_height[sidx] = sec_arranged_fig_height.get(sidx, 0.0) + float(fg.get("height", 0.0) or 0.0)
    for i in list(sec_figs.keys()):
        sec_figs[i].sort(key=lambda x: x["order_y"])
    for sidx, figs in sec_figs.items():
        if not figs: continue
        panel_h = sec_panel_height.get(sidx, 0.0)
        arranged_h = sec_arranged_fig_height.get(sidx, 0.0)
        content = sections[sidx].get("content","") or ""
        n_chars = len(content.strip().replace("\n"," "))
        n_lines = math.ceil(n_chars / max(1, TEXT_CHAR_PER_LINE))
        text_ratio = n_lines * LINE_HEIGHT_WEIGHT
        ratio_limit = max(0.30, BASE_FIG_RATIO_LIMIT - min(0.25, 0.12 * (n_chars/600.0)))
        cur_ratio = 0.0 if panel_h <= 0 else arranged_h / panel_h
        safety = 0.08
        allowed = max(0.0, ratio_limit - text_ratio - safety)
        if cur_ratio > 0 and allowed > 0 and cur_ratio > allowed:
            scale = allowed / cur_ratio
            for it in figs:
                it["width_frac"] = max(FIG_MIN_FRAC, min(FIG_MAX_FRAC, it["width_frac"] * scale))
    return sec_figs

def figures_to_latex_beamer(fig_list, out_tex_path: pathlib.Path, images_parent: pathlib.Path) -> str:
    chunks=[]
    for it in fig_list:
        rel = copy_and_get_relpath(it["src"], out_tex_path, images_parent)
        w = it["width_frac"]; cap = escape_text(it["caption"] or "")
        chunks.append("\\begin{figure}\n\\centering\n"
                      f"\\includegraphics[width={w:.2f}\\linewidth]{{{rel}}}\n"
                      + (f"\\caption{{{cap}}}\n" if cap else "") + "\\end{figure}\n")
    return "\n".join(chunks)

def figures_to_latex_baposter(fig_list, out_tex_path: pathlib.Path, images_parent: pathlib.Path) -> str:
    chunks=[]
    for it in fig_list:
        rel = copy_and_get_relpath(it["src"], out_tex_path, images_parent)
        basename = os.path.basename(rel)  # 只写文件名
        w = max(0.90, min(0.98, it["width_frac"]))  # 稍微更大
        cap = escape_text(it["caption"] or "")
        chunks.append(
            "\\begin{center}\n"
            +f"\\includegraphics[width={w:.2f}\\linewidth]{{{basename}}}\n"
            + (f"\\captionof{{figure}}{{{cap}}}\n" if cap else "")
            +"\\vspace{-0.2em}\n"
            +"\\end{center}\n"
        )
    return "\n".join(chunks)

# ### NEW: 估算 section 占用(用于 baposter 溢出防护 & beamer 加权)
def _estimate_section_occupancy(section, figs_for_section):
    content = section.get("content","") or ""
    n_chars = len(content.strip().replace("\n"," "))
    n_lines = math.ceil(n_chars / max(1, TEXT_CHAR_PER_LINE))
    text_part = n_lines * LINE_HEIGHT_WEIGHT
    fig_part  = sum(max(0.45, min(0.85, it.get("width_frac", 0.7))) for it in figs_for_section)
    return text_part + fig_part

# ### NEW: beamer 自适应列宽(根据每列最长标题;不使用 span)
def _compute_beamer_col_fracs(sections, per_col_idxs, sep_frac=SEP_FRAC_DEFAULT):
    # 初始权重
    w = [1.0, 1.0, 1.0]
    # 找每列内最长标题
    longest = []
    for col, idxs in enumerate(per_col_idxs):
        if not idxs:
            longest.append(0)
            continue
        longest_title = max(len((sections[i].get("title") or "")) for i in idxs)
        longest.append(longest_title)
    # 给最长的那一列加权
    if longest:
        j = int(max(range(len(longest)), key=lambda k: longest[k] if len(longest)>0 else 0))
        if longest[j] >= LONG_TITLE_THRESHOLD:
            w[j] += W_HEAVY_BOOST
    total_w = sum(w) if sum(w)>0 else 3.0
    # 可用总宽(除去 4 个分隔列)
    usable = 1.0 - 4*sep_frac
    # 归一化并夹紧
    fracs = [max(COL_FRAC_MIN, min(COL_FRAC_MAX, usable * (wi/total_w))) for wi in w]
    # 可能因为夹紧导致和不等于 usable,再次归一化一次以严格填满
    s = sum(fracs)
    if s > 0:
        fracs = [fi * usable / s for fi in fracs]
    return fracs

# ### NEW: baposter 列占用超限时,统一缩放该列图宽,并有溢出则不加 above=bottom
def _rebalance_baposter(secidx_to_figs, sections, per_col_idxs, max_occupancy=0.98):
    col_occupancies = []
    for col, idxs in enumerate(per_col_idxs):
        occ = 0.0
        for sidx in idxs:
            figs = secidx_to_figs.get(sidx, [])
            occ += _estimate_section_occupancy(sections[sidx], figs)
        col_occupancies.append(occ)

    # 对占用超限的列,按比例缩放图片宽度
    for col, (occ, idxs) in enumerate(zip(col_occupancies, per_col_idxs)):
        if occ > max_occupancy and occ > 0:
            scale = max(0.80, min(0.97, max_occupancy / occ))
            for sidx in idxs:
                for it in secidx_to_figs.get(sidx, []):
                    it["width_frac"] = max(FIG_MIN_FRAC, min(FIG_MAX_FRAC, it["width_frac"] * scale))

    # 返回每列是否允许 bottom 对齐(占用安全才允许)
    allow_bottom = [occ <= max_occupancy for occ in col_occupancies]
    return allow_bottom

# ---------- 主流程 ----------
def main():
    OUTPUT_DIR.mkdir(parents=True, exist_ok=True)

    data = json.loads(JSON_PATH.read_text(encoding="utf-8"))
    meta = data.get("meta", {}) or {}
    secs_all = data.get("sections", []) or []
    sections = [s for s in secs_all if norm_title(s.get("title","")) != norm_title("Poster Title & Author")]

    panels_by_id, figures, cap_full, cap_base = load_arrangement_and_captions()
    sample_paths = [pathlib.Path(f.get("figure_path","")) for f in figures if f.get("figure_path")]
    images_parent = resolve_images_parent_dir(sample_paths)

    template = TEMPLATE_PATH.read_text(encoding="utf-8")
    mode = detect_template(template)
    wrapped_title, authors, affiliations = build_header_from_meta(meta)

    if mode == "beamer":
        new_tex = replace_command_balanced(template, "title", f"\\title{{{escape_text(wrapped_title)}}}")
        new_tex = replace_command_balanced(new_tex, "author", f"\\author{{{escape_text(authors)}}}")
        new_tex = replace_command_balanced(new_tex, "institute", f"\\institute[shortinst]{{{escape_text(affiliations)}}}")
        new_tex = bump_beamerposter_scale(new_tex, BEAMER_SCALE_TARGET)
        new_tex = inject_font_tweaks_beamer(new_tex, choose_title_size_cmd(wrapped_title))
        new_tex = inject_right_logo_beamer(new_tex)

        secidx_to_figs = build_figures_for_sections(sections, panels_by_id, figures, cap_full, cap_base)
        blocks=[]
        for i, sec in enumerate(sections):
            figs_tex = figures_to_latex_beamer(secidx_to_figs.get(i, []), OUTPUT_PATH, images_parent) if secidx_to_figs.get(i) else ""
            body = format_content_to_latex(sec.get("content",""))
            if figs_tex: body = (body + "\n\n" if body else "") + figs_tex
            blocks.append(f"\\begin{{block}}{{{escape_text(sec.get('title',''))}}}\n{body}\n\\end{{block}}\n")

        pos_doc = new_tex.find(r"\begin{document}")
        if pos_doc == -1: raise RuntimeError("未找到 \\begin{document}")
        b,e = find_env_bounds(new_tex, "columns", pos_doc)
        if b is None: raise RuntimeError("未在文档主体找到 \\begin{columns} ... \\end{columns}")
        region = new_tex[b:e]
        begin_tok = extract_begin_token_with_options(region, "columns")
        per_col_blocks = split_even_continuous(blocks, 3)

        # ### NEW: 计算自适应列宽,并注入固定长度,避免整体偏左
        col_fracs = _compute_beamer_col_fracs(sections, [list(range(len(x))) for x in split_even_continuous(list(range(len(sections))), 3)], sep_frac=SEP_FRAC_DEFAULT)
        new_tex = inject_beamer_column_widths(new_tex, col_fracs, SEP_FRAC_DEFAULT)

        # ### NEW: 显式插入分隔列(\sepwidth)与三列具体宽度(\colA/B/Cwidth),严格填满
        body_lines=[]
        # leading separator
        body_lines.append(r"\begin{column}{\sepwidth}\end{column}")
        colw_macros = [r"\colAwidth", r"\colBwidth", r"\colCwidth"]
        for i in range(3):
            body_lines.append(r"\begin{column}{\sepwidth}\end{column}")
            body_lines.append(fr"\begin{{column}}{{{colw_macros[i]}}}")
            if per_col_blocks[i]: body_lines.append("\n".join(per_col_blocks[i]))
            body_lines.append(r"\end{column}")
        # trailing separator
        body_lines.append(r"\begin{column}{\sepwidth}\end{column}")

        columns_new = begin_tok + "\n" + "\n".join(body_lines) + "\n\\end{columns}"
        new_tex = new_tex[:b] + columns_new + new_tex[e:]

    else:
        # --- baposter ---
        new_tex = bump_baposter_fontscale(template, BAPOSTER_FONTSCALE_TARGET)

        # 把页面边距压小,让三列更“铺满”
        new_tex = bump_baposter_margin(new_tex, "7mm")   # 你也可以试 "5mm" 或 "10mm"

        new_tex = rewrite_baposter_header(new_tex, wrapped_title, authors, affiliations)
        new_tex = enforce_baposter_three_columns(new_tex)

        # 3 列均匀 + 列底对齐(带溢出防护)
        per_col_idxs = split_even_continuous(list(range(len(sections))), 3)
        secidx_to_figs = build_figures_for_sections(sections, panels_by_id, figures, cap_full, cap_base)

        # ### NEW: 根据每列估算占用,必要时缩放图宽,且仅在安全时对最后一个 headerbox 使用 above=bottom
        allow_bottom = _rebalance_baposter(secidx_to_figs, sections, per_col_idxs, max_occupancy=0.98)

        bodies = []
        for i, sec in enumerate(sections):
            figs_tex = figures_to_latex_baposter(secidx_to_figs.get(i, []), OUTPUT_PATH, images_parent) if secidx_to_figs.get(i) else ""
            bodies.append(format_content_to_latex(sec.get("content","")) + ("\n\n"+figs_tex if figs_tex else ""))

        hb_parts=[]; used=set(); prev={0:None,1:None,2:None}
        for col, idxs in enumerate(per_col_idxs):
            for j, sidx in enumerate(idxs):
                title = sections[sidx].get("title","") or f"Section {sidx+1}"
                base = slug_name(title); name = base; k=1
                while name in used: k+=1; name=f"{base}{k}"
                used.add(name)
                is_first = (prev[col] is None)
                is_last  = (j == len(idxs)-1)
                if is_first:
                    opts = f"column={col},row=0,span=1"
                else:
                    opts = f"column={col},below={prev[col]},span=1"
                # 仅当该列估算占用安全时,才将最后一个 box 固定到底部,避免溢出重叠
                if is_last and allow_bottom[col]:
                    opts += ",above=bottom"
                hb_parts.append(headerbox_text(title, name, opts, bodies[sidx]))
                prev[col] = name

        body_all = "\n".join(hb_parts)
        new_tex = wipe_poster_body_and_insert(new_tex, body_all)

    OUTPUT_PATH.write_text(new_tex, encoding="utf-8")
    print(f"✅ Wrote: {OUTPUT_PATH.relative_to(ROOT_DIR)}")
    print(f"📁 Figures copied to: {OUTPUT_DIR / 'figures'}")
    print(f"🧩 Template detected: {mode}")

if __name__ == "__main__":
    main()