@inproceedings{lin-etal-2026-mptc,
title = "{MPT}c-Bench: Measuring Cross-market Generative Ability of Vision-Language Models via Movie Poster Transcreation",
author = "Lin, Youyuan and
Li, Yuan and
Yu, Yahan and
Cheng, Fei and
Nishida, Shin{'}ya and
Chu, Chenhui",
editor = "Liakata, Maria and
Moreira, Viviane P. and
Zhang, Jiajun and
Jurgens, David",
booktitle = "Findings of the {A}ssociation for {C}omputational {L}inguistics: {ACL} 2026",
month = jul,
year = "2026",
address = "San Diego, California, United States",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2026.findings-acl.1889/",
pages = "37897--37913",
ISBN = "979-8-89176-395-1",
abstract = "Generative vision-language models (VLMs) can edit and synthesize images, yet their ability to adapt visual assets across markets remains under-evaluated.We study cross-market image transcreation via movie posters, where localization must preserve a movie{'}s identity while matching market-specific design preferences and multilingual typography.We introduce the Movie Poster Transcreation Benchmark (MPTc-Bench), a cross-market benchmark of 582 aligned poster examples spanning 34 target markets, and define two task variants: $\textbf{Surface}$ (text-centric localization) and $\textbf{Deep}$ (preference-level style adaptation).We propose a two-stage planner-editor pipeline in which an VLM planner specifies executable edits and an image editor renders them.We evaluate in a triplet setup (source, human target-market poster, model output) using information-preservation checks, LLM-as-a-judge ratings for aesthetics and target-market fit, and objective similarity signals.Across multiple planners and editors, experiments reveal substantial gaps between model outputs and human target-market posters, highlighting open challenges for market-aware generation.MPTc-Bench enables controlled, quantitative progress on cross-market image editing beyond understanding-centric benchmarks."
}<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="lin-etal-2026-mptc">
<titleInfo>
<title>MPTc-Bench: Measuring Cross-market Generative Ability of Vision-Language Models via Movie Poster Transcreation</title>
</titleInfo>
<name type="personal">
<namePart type="given">Youyuan</namePart>
<namePart type="family">Lin</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yuan</namePart>
<namePart type="family">Li</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yahan</namePart>
<namePart type="family">Yu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Fei</namePart>
<namePart type="family">Cheng</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Shin’ya</namePart>
<namePart type="family">Nishida</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Chenhui</namePart>
<namePart type="family">Chu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2026-07</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Findings of the Association for Computational Linguistics: ACL 2026</title>
</titleInfo>
<name type="personal">
<namePart type="given">Maria</namePart>
<namePart type="family">Liakata</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Viviane</namePart>
<namePart type="given">P</namePart>
<namePart type="family">Moreira</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Jiajun</namePart>
<namePart type="family">Zhang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">David</namePart>
<namePart type="family">Jurgens</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">San Diego, California, United States</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
<identifier type="isbn">979-8-89176-395-1</identifier>
</relatedItem>
<abstract>Generative vision-language models (VLMs) can edit and synthesize images, yet their ability to adapt visual assets across markets remains under-evaluated.We study cross-market image transcreation via movie posters, where localization must preserve a movie’s identity while matching market-specific design preferences and multilingual typography.We introduce the Movie Poster Transcreation Benchmark (MPTc-Bench), a cross-market benchmark of 582 aligned poster examples spanning 34 target markets, and define two task variants: Surface (text-centric localization) and Deep (preference-level style adaptation).We propose a two-stage planner-editor pipeline in which an VLM planner specifies executable edits and an image editor renders them.We evaluate in a triplet setup (source, human target-market poster, model output) using information-preservation checks, LLM-as-a-judge ratings for aesthetics and target-market fit, and objective similarity signals.Across multiple planners and editors, experiments reveal substantial gaps between model outputs and human target-market posters, highlighting open challenges for market-aware generation.MPTc-Bench enables controlled, quantitative progress on cross-market image editing beyond understanding-centric benchmarks.</abstract>
<identifier type="citekey">lin-etal-2026-mptc</identifier>
<location>
<url>https://aclanthology.org/2026.findings-acl.1889/</url>
</location>
<part>
<date>2026-07</date>
<extent unit="page">
<start>37897</start>
<end>37913</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T MPTc-Bench: Measuring Cross-market Generative Ability of Vision-Language Models via Movie Poster Transcreation
%A Lin, Youyuan
%A Li, Yuan
%A Yu, Yahan
%A Cheng, Fei
%A Nishida, Shin’ya
%A Chu, Chenhui
%Y Liakata, Maria
%Y Moreira, Viviane P.
%Y Zhang, Jiajun
%Y Jurgens, David
%S Findings of the Association for Computational Linguistics: ACL 2026
%D 2026
%8 July
%I Association for Computational Linguistics
%C San Diego, California, United States
%@ 979-8-89176-395-1
%F lin-etal-2026-mptc
%X Generative vision-language models (VLMs) can edit and synthesize images, yet their ability to adapt visual assets across markets remains under-evaluated.We study cross-market image transcreation via movie posters, where localization must preserve a movie’s identity while matching market-specific design preferences and multilingual typography.We introduce the Movie Poster Transcreation Benchmark (MPTc-Bench), a cross-market benchmark of 582 aligned poster examples spanning 34 target markets, and define two task variants: Surface (text-centric localization) and Deep (preference-level style adaptation).We propose a two-stage planner-editor pipeline in which an VLM planner specifies executable edits and an image editor renders them.We evaluate in a triplet setup (source, human target-market poster, model output) using information-preservation checks, LLM-as-a-judge ratings for aesthetics and target-market fit, and objective similarity signals.Across multiple planners and editors, experiments reveal substantial gaps between model outputs and human target-market posters, highlighting open challenges for market-aware generation.MPTc-Bench enables controlled, quantitative progress on cross-market image editing beyond understanding-centric benchmarks.
%U https://aclanthology.org/2026.findings-acl.1889/
%P 37897-37913
Markdown (Informal)
[MPTc-Bench: Measuring Cross-market Generative Ability of Vision-Language Models via Movie Poster Transcreation](https://aclanthology.org/2026.findings-acl.1889/) (Lin et al., Findings 2026)
ACL