% BibTeX record for the tutorial abstract at https://aclanthology.org/2026.eacl-tutorials.4/
% Text outside an entry is ignored by BibTeX, so these header lines are inert.
% Braces protect whole words (not single letters) so kerning and hyphenation
% are unaffected when a style re-cases the field.
@inproceedings{joty-etal-2026-multimodal,
  title     = {Multimodal Large Language Models for Human-{AI} Interaction: Foundations, Agents, and Inclusive Applications},
  author    = {Joty, Shafiq and
               Hoque, Enamul and
               Masry, Ahmed and
               Gella, Spandana and
               Kahou, Samira Ebrahimi},
  editor    = {Lin, Chenghua and
               Paes, Aline and
               Wilkens, Rodrigo},
  booktitle = {Proceedings of the 19th Conference of the {European} Chapter of the {Association} for {Computational} {Linguistics} (Volume 6: Tutorial Abstracts)},
  month     = mar,
  year      = {2026},
  address   = {St. Julian's, Malta},
  publisher = {Association for Computational Linguistics},
  url       = {https://aclanthology.org/2026.eacl-tutorials.4/},
  pages     = {9--11},
  isbn      = {979-8-89176-385-2},
  abstract  = {This tutorial presents foundations, agentic capabilities, and inclusive applications of multimodal large language models, covering architectures, multimodal alignment and reasoning, conversational GUI agents, accessibility, multilingual communication, and responsible deployment.},
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
  <!-- Single MODS record; its ID matches the citekey identifier further down. -->
  <mods ID="joty-etal-2026-multimodal">

    <!-- Title of the work itself. -->
    <titleInfo>
      <title>Multimodal Large Language Models for Human-AI Interaction: Foundations, Agents, and Inclusive Applications</title>
    </titleInfo>

    <!-- Authors, in citation order. -->
    <name type="personal">
      <namePart type="given">Shafiq</namePart>
      <namePart type="family">Joty</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Enamul</namePart>
      <namePart type="family">Hoque</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Ahmed</namePart>
      <namePart type="family">Masry</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <namePart type="given">Spandana</namePart>
      <namePart type="family">Gella</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>
    <name type="personal">
      <!-- Two given-name parts are recorded separately for this author. -->
      <namePart type="given">Samira</namePart>
      <namePart type="given">Ebrahimi</namePart>
      <namePart type="family">Kahou</namePart>
      <role>
        <roleTerm authority="marcrelator" type="text">author</roleTerm>
      </role>
    </name>

    <!-- Issue date of the work (year-month). -->
    <originInfo>
      <dateIssued>2026-03</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>

    <!-- Host item: the proceedings volume, with its editors, publisher, place and ISBN. -->
    <relatedItem type="host">
      <titleInfo>
        <title>Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 6: Tutorial Abstracts)</title>
      </titleInfo>
      <name type="personal">
        <namePart type="given">Chenghua</namePart>
        <namePart type="family">Lin</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Aline</namePart>
        <namePart type="family">Paes</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <name type="personal">
        <namePart type="given">Rodrigo</namePart>
        <namePart type="family">Wilkens</namePart>
        <role>
          <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
      </name>
      <originInfo>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
          <placeTerm type="text">St. Julian’s, Malta</placeTerm>
        </place>
      </originInfo>
      <genre authority="marcgt">conference publication</genre>
      <identifier type="isbn">979-8-89176-385-2</identifier>
    </relatedItem>

    <!-- Abstract, citation key and landing-page URL of the work. -->
    <abstract>This tutorial presents foundations, agentic capabilities, and inclusive applications of multimodal large language models, covering architectures, multimodal alignment and reasoning, conversational GUI agents, accessibility, multilingual communication, and responsible deployment.</abstract>
    <identifier type="citekey">joty-etal-2026-multimodal</identifier>
    <location>
      <url>https://aclanthology.org/2026.eacl-tutorials.4/</url>
    </location>

    <!-- Position within the host volume: pages 9 to 11. -->
    <part>
      <date>2026-03</date>
      <extent unit="page">
        <start>9</start>
        <end>11</end>
      </extent>
    </part>

  </mods>
</modsCollection>
%0 Conference Proceedings
%F joty-etal-2026-multimodal
%T Multimodal Large Language Models for Human-AI Interaction: Foundations, Agents, and Inclusive Applications
%A Joty, Shafiq
%A Hoque, Enamul
%A Masry, Ahmed
%A Gella, Spandana
%A Kahou, Samira Ebrahimi
%S Proceedings of the 19th Conference of the European Chapter of the Association for Computational Linguistics (Volume 6: Tutorial Abstracts)
%Y Lin, Chenghua
%Y Paes, Aline
%Y Wilkens, Rodrigo
%8 March
%D 2026
%C St. Julian’s, Malta
%I Association for Computational Linguistics
%P 9-11
%@ 979-8-89176-385-2
%U https://aclanthology.org/2026.eacl-tutorials.4/
%X This tutorial presents foundations, agentic capabilities, and inclusive applications of multimodal large language models, covering architectures, multimodal alignment and reasoning, conversational GUI agents, accessibility, multilingual communication, and responsible deployment.
Markdown (Informal)
[Multimodal Large Language Models for Human-AI Interaction: Foundations, Agents, and Inclusive Applications](https://aclanthology.org/2026.eacl-tutorials.4/) (Joty et al., EACL 2026)
ACL