﻿<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="ws-2016-vision">
    <titleInfo>
        <title>Proceedings of the 5th Workshop on Vision and Language</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Anya</namePart>
        <namePart type="family">Belz</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Erkut</namePart>
        <namePart type="family">Erdem</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Krystian</namePart>
        <namePart type="family">Mikolajczyk</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Katerina</namePart>
        <namePart type="family">Pastra</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">editor</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
        <publisher>Association for Computational Linguistics</publisher>
        <place>
            <placeTerm type="text">Berlin, Germany</placeTerm>
        </place>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <genre authority="marcgt">conference publication</genre>
    <identifier type="citekey">ws-2016-vision</identifier>
    <location>
        <url>https://aclanthology.org/W16-3200/</url>
    </location>
</mods>
<mods ID="elhoseiny-etal-2016-automatic">
    <titleInfo>
        <title>Automatic Annotation of Structured Facts in Images</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Mohamed</namePart>
        <namePart type="family">Elhoseiny</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Scott</namePart>
        <namePart type="family">Cohen</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Walter</namePart>
        <namePart type="family">Chang</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Brian</namePart>
        <namePart type="family">Price</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Ahmed</namePart>
        <namePart type="family">Elgammal</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">elhoseiny-etal-2016-automatic</identifier>
    <identifier type="doi">10.18653/v1/W16-3201</identifier>
    <location>
        <url>https://aclanthology.org/W16-3201/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>1</start>
            <end>9</end>
        </extent>
    </part>
</mods>
<mods ID="hurlimann-bos-2016-combining">
    <titleInfo>
        <title>Combining Lexical and Spatial Knowledge to Predict Spatial Relations between Objects in Images</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Manuela</namePart>
        <namePart type="family">Hürlimann</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Johan</namePart>
        <namePart type="family">Bos</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">hurlimann-bos-2016-combining</identifier>
    <identifier type="doi">10.18653/v1/W16-3202</identifier>
    <location>
        <url>https://aclanthology.org/W16-3202/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>10</start>
            <end>18</end>
        </extent>
    </part>
</mods>
<mods ID="hodosh-hockenmaier-2016-focused">
    <titleInfo>
        <title>Focused Evaluation for Image Description with Binary Forced-Choice Tasks</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Micah</namePart>
        <namePart type="family">Hodosh</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Julia</namePart>
        <namePart type="family">Hockenmaier</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">hodosh-hockenmaier-2016-focused</identifier>
    <identifier type="doi">10.18653/v1/W16-3203</identifier>
    <location>
        <url>https://aclanthology.org/W16-3203/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>19</start>
            <end>28</end>
        </extent>
    </part>
</mods>
<mods ID="kilickaya-etal-2016-leveraging">
    <titleInfo>
        <title>Leveraging Captions in the Wild to Improve Object Detection</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Mert</namePart>
        <namePart type="family">Kilickaya</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Nazli</namePart>
        <namePart type="family">Ikizler-Cinbis</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Erkut</namePart>
        <namePart type="family">Erdem</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Aykut</namePart>
        <namePart type="family">Erdem</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">kilickaya-etal-2016-leveraging</identifier>
    <identifier type="doi">10.18653/v1/W16-3204</identifier>
    <location>
        <url>https://aclanthology.org/W16-3204/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>29</start>
            <end>38</end>
        </extent>
    </part>
</mods>
<mods ID="alharbi-gotoh-2016-natural">
    <titleInfo>
        <title>Natural Language Descriptions of Human Activities Scenes: Corpus Generation and Analysis</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Nouf</namePart>
        <namePart type="family">Alharbi</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Yoshihiko</namePart>
        <namePart type="family">Gotoh</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">alharbi-gotoh-2016-natural</identifier>
    <identifier type="doi">10.18653/v1/W16-3205</identifier>
    <location>
        <url>https://aclanthology.org/W16-3205/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>39</start>
            <end>47</end>
        </extent>
    </part>
</mods>
<mods ID="yu-etal-2016-interactively">
    <titleInfo>
        <title>Interactively Learning Visually Grounded Word Meanings from a Human Tutor</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Yanchao</namePart>
        <namePart type="family">Yu</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Arash</namePart>
        <namePart type="family">Eshghi</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Oliver</namePart>
        <namePart type="family">Lemon</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">yu-etal-2016-interactively</identifier>
    <identifier type="doi">10.18653/v1/W16-3206</identifier>
    <location>
        <url>https://aclanthology.org/W16-3206/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>48</start>
            <end>53</end>
        </extent>
    </part>
</mods>
<mods ID="van-miltenburg-etal-2016-pragmatic">
    <titleInfo>
        <title>Pragmatic Factors in Image Description: The Case of Negations</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Emiel</namePart>
        <namePart type="family">van Miltenburg</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Roser</namePart>
        <namePart type="family">Morante</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Desmond</namePart>
        <namePart type="family">Elliott</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">van-miltenburg-etal-2016-pragmatic</identifier>
    <identifier type="doi">10.18653/v1/W16-3207</identifier>
    <location>
        <url>https://aclanthology.org/W16-3207/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>54</start>
            <end>59</end>
        </extent>
    </part>
</mods>
<mods ID="pezzelle-etal-2016-building">
    <titleInfo>
        <title>Building a Bagpipe with a Bag and a Pipe: Exploring Conceptual Combination in Vision</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Sandro</namePart>
        <namePart type="family">Pezzelle</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Ravi</namePart>
        <namePart type="family">Shekhar</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Raffaella</namePart>
        <namePart type="family">Bernardi</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">pezzelle-etal-2016-building</identifier>
    <identifier type="doi">10.18653/v1/W16-3208</identifier>
    <location>
        <url>https://aclanthology.org/W16-3208/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>60</start>
            <end>64</end>
        </extent>
    </part>
</mods>
<mods ID="belz-etal-2016-exploring">
    <titleInfo>
        <title>Exploring Different Preposition Sets, Models and Feature Sets in Automatic Generation of Spatial Image Descriptions</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Anja</namePart>
        <namePart type="family">Belz</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Adrian</namePart>
        <namePart type="family">Muscat</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Brandon</namePart>
        <namePart type="family">Birmingham</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">belz-etal-2016-exploring</identifier>
    <identifier type="doi">10.18653/v1/W16-3209</identifier>
    <location>
        <url>https://aclanthology.org/W16-3209/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>65</start>
            <end>69</end>
        </extent>
    </part>
</mods>
<mods ID="elliott-etal-2016-multi30k">
    <titleInfo>
        <title>Multi30K: Multilingual English-German Image Descriptions</title>
    </titleInfo>
    <name type="personal">
        <namePart type="given">Desmond</namePart>
        <namePart type="family">Elliott</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Stella</namePart>
        <namePart type="family">Frank</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Khalil</namePart>
        <namePart type="family">Sima’an</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Lucia</namePart>
        <namePart type="family">Specia</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <identifier type="citekey">elliott-etal-2016-multi30k</identifier>
    <identifier type="doi">10.18653/v1/W16-3210</identifier>
    <location>
        <url>https://aclanthology.org/W16-3210/</url>
    </location>
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>70</start>
            <end>74</end>
        </extent>
    </part>
</mods>
<mods ID="sorodoc-etal-2016-look">
    <!-- Record for a single paper: six authors, issued 2016-08, pages 75 to 79 of the host volume. -->
    <titleInfo>
        <title>“Look, some Green Circles!”: Learning to Quantify from Images</title>
    </titleInfo>
    <!-- Authors, one <name> element per person, in document order. -->
    <name type="personal">
        <namePart type="given">Ionut</namePart>
        <namePart type="family">Sorodoc</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Angeliki</namePart>
        <namePart type="family">Lazaridou</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Gemma</namePart>
        <namePart type="family">Boleda</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Aurélie</namePart>
        <namePart type="family">Herbelot</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Sandro</namePart>
        <namePart type="family">Pezzelle</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Raffaella</namePart>
        <namePart type="family">Bernardi</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume containing this paper, with its editors, publisher and place. -->
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <!-- The citekey repeats the value of the ID attribute on the enclosing <mods> element. -->
    <identifier type="citekey">sorodoc-etal-2016-look</identifier>
    <identifier type="doi">10.18653/v1/W16-3211</identifier>
    <location>
        <url>https://aclanthology.org/W16-3211/</url>
    </location>
    <!-- Position of the paper within the host volume: date and inclusive page range. -->
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>75</start>
            <end>79</end>
        </extent>
    </part>
</mods>
<mods ID="mehler-etal-2016-text2voronoi">
    <!-- Record for a single paper: three authors, issued 2016-08, pages 80 to 85 of the host volume. -->
    <titleInfo>
        <title>Text2voronoi: An Image-driven Approach to Differential Diagnosis</title>
    </titleInfo>
    <!-- Authors, one <name> element per person, in document order. -->
    <name type="personal">
        <namePart type="given">Alexander</namePart>
        <namePart type="family">Mehler</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Tolga</namePart>
        <namePart type="family">Uslu</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Wahed</namePart>
        <namePart type="family">Hemati</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume containing this paper, with its editors, publisher and place. -->
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <!-- The citekey repeats the value of the ID attribute on the enclosing <mods> element. -->
    <identifier type="citekey">mehler-etal-2016-text2voronoi</identifier>
    <identifier type="doi">10.18653/v1/W16-3212</identifier>
    <location>
        <url>https://aclanthology.org/W16-3212/</url>
    </location>
    <!-- Position of the paper within the host volume: date and inclusive page range. -->
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>80</start>
            <end>85</end>
        </extent>
    </part>
</mods>
<mods ID="winn-etal-2016-detecting">
    <!-- Record for a single paper: three authors, issued 2016-08, pages 86 to 91 of the host volume. -->
    <titleInfo>
        <title>Detecting Visually Relevant Sentences for Fine-Grained Classification</title>
    </titleInfo>
    <!-- Authors, one <name> element per person, in document order. -->
    <name type="personal">
        <namePart type="given">Olivia</namePart>
        <namePart type="family">Winn</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <!-- This author has two given-name parts, each in its own namePart element; this is not a duplicate entry. -->
    <name type="personal">
        <namePart type="given">Madhavan</namePart>
        <namePart type="given">Kavanur</namePart>
        <namePart type="family">Kidambi</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <name type="personal">
        <namePart type="given">Smaranda</namePart>
        <namePart type="family">Muresan</namePart>
        <role>
            <roleTerm authority="marcrelator" type="text">author</roleTerm>
        </role>
    </name>
    <originInfo>
        <dateIssued>2016-08</dateIssued>
    </originInfo>
    <typeOfResource>text</typeOfResource>
    <!-- Host item: the proceedings volume containing this paper, with its editors, publisher and place. -->
    <relatedItem type="host">
        <titleInfo>
            <title>Proceedings of the 5th Workshop on Vision and Language</title>
        </titleInfo>
        <name type="personal">
            <namePart type="given">Anya</namePart>
            <namePart type="family">Belz</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Erkut</namePart>
            <namePart type="family">Erdem</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Krystian</namePart>
            <namePart type="family">Mikolajczyk</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <name type="personal">
            <namePart type="given">Katerina</namePart>
            <namePart type="family">Pastra</namePart>
            <role>
                <roleTerm authority="marcrelator" type="text">editor</roleTerm>
            </role>
        </name>
        <originInfo>
            <publisher>Association for Computational Linguistics</publisher>
            <place>
                <placeTerm type="text">Berlin, Germany</placeTerm>
            </place>
        </originInfo>
        <genre authority="marcgt">conference publication</genre>
    </relatedItem>
    <!-- The citekey repeats the value of the ID attribute on the enclosing <mods> element. -->
    <identifier type="citekey">winn-etal-2016-detecting</identifier>
    <identifier type="doi">10.18653/v1/W16-3213</identifier>
    <location>
        <url>https://aclanthology.org/W16-3213/</url>
    </location>
    <!-- Position of the paper within the host volume: date and inclusive page range. -->
    <part>
        <date>2016-08</date>
        <extent unit="page">
            <start>86</start>
            <end>91</end>
        </extent>
    </part>
</mods>
</modsCollection>
