<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article article-type="brief-report" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/frai.2026.1753041</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading"><subject>Perspective</subject></subj-group>
</article-categories>
<title-group>
<article-title>Computational hermeneutics: evaluating generative AI as a cultural technology</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Kommers</surname>
<given-names>Cody</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3291808"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ahnert</surname>
<given-names>Ruth</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Antoniak</surname>
<given-names>Maria</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Benetos</surname>
<given-names>Emmanouil</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/538210"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Benford</surname>
<given-names>Steve</given-names>
</name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3333751"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bunz</surname>
<given-names>Mercedes</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Caramiaux</surname>
<given-names>Baptiste</given-names>
</name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Concannon</surname>
<given-names>Shauna</given-names>
</name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2325556"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Disley</surname>
<given-names>Martin</given-names>
</name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Dobson</surname>
<given-names>James</given-names>
</name>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3391099/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Du</surname>
<given-names>Yali</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Du&#x00E9;&#x00F1;ez-Guzm&#x00E1;n</surname>
<given-names>Edgar</given-names>
</name>
<xref ref-type="aff" rid="aff10"><sup>10</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Francksen</surname>
<given-names>Kerry</given-names>
</name>
<xref ref-type="aff" rid="aff11"><sup>11</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gius</surname>
<given-names>Evelyn</given-names>
</name>
<xref ref-type="aff" rid="aff12"><sup>12</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gray</surname>
<given-names>Jonathan W. Y.</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/931465"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Heuser</surname>
<given-names>Ryan</given-names>
</name>
<xref ref-type="aff" rid="aff13"><sup>13</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3371879"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Immel</surname>
<given-names>Sarah</given-names>
</name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3371776"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>So</surname>
<given-names>Richard Jean</given-names>
</name>
<xref ref-type="aff" rid="aff14"><sup>14</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Leigh</surname>
<given-names>Sang</given-names>
</name>
<xref ref-type="aff" rid="aff15"><sup>15</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3294239"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Livingston</surname>
<given-names>Dalaki</given-names>
</name>
<xref ref-type="aff" rid="aff16"><sup>16</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Long</surname>
<given-names>Hoyt</given-names>
</name>
<xref ref-type="aff" rid="aff17"><sup>17</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Martin</surname>
<given-names>Meredith</given-names>
</name>
<xref ref-type="aff" rid="aff18"><sup>18</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Meyer</surname>
<given-names>Georgia</given-names>
</name>
<xref ref-type="aff" rid="aff19"><sup>19</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mihai</surname>
<given-names>Daniela</given-names>
</name>
<xref ref-type="aff" rid="aff20"><sup>20</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Noel-Hirst</surname>
<given-names>Ashley</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ostherr</surname>
<given-names>Kirsten</given-names>
</name>
<xref ref-type="aff" rid="aff21"><sup>21</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Parker</surname>
<given-names>Deven</given-names>
</name>
<xref ref-type="aff" rid="aff22"><sup>22</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Qin</surname>
<given-names>Yipeng</given-names>
</name>
<xref ref-type="aff" rid="aff23"><sup>23</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1803603"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ratcliff</surname>
<given-names>Jessica</given-names>
</name>
<xref ref-type="aff" rid="aff15"><sup>15</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Robinson</surname>
<given-names>Emily</given-names>
</name>
<xref ref-type="aff" rid="aff24"><sup>24</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rodriguez</surname>
<given-names>Karina</given-names>
</name>
<xref ref-type="aff" rid="aff25"><sup>25</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sobey</surname>
<given-names>Adam</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff20"><sup>20</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Underwood</surname>
<given-names>Ted</given-names>
</name>
<xref ref-type="aff" rid="aff26"><sup>26</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Vashistha</surname>
<given-names>Aditya</given-names>
</name>
<xref ref-type="aff" rid="aff15"><sup>15</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wilkens</surname>
<given-names>Matthew</given-names>
</name>
<xref ref-type="aff" rid="aff15"><sup>15</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Youyou</given-names>
</name>
<xref ref-type="aff" rid="aff27"><sup>27</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2025964"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zheng</surname>
<given-names>Yuan</given-names>
</name>
<xref ref-type="aff" rid="aff28"><sup>28</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hemment</surname>
<given-names>Drew</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff29"><sup>29</sup></xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &#x0026; editing</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>The Alan Turing Institute</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff2"><label>2</label><institution>Queen Mary University of London</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff3"><label>3</label><institution>University of Colorado</institution>, <city>Boulder</city>, <state>CO</state>, <country country="us">United States</country></aff>
<aff id="aff4"><label>4</label><institution>University of Nottingham</institution>, <city>Nottingham</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff5"><label>5</label><institution>King&#x2019;s College London</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff6"><label>6</label><institution>Sorbonne Universit&#x00E9;</institution>, <city>Paris</city>, <country country="fr">France</country></aff>
<aff id="aff7"><label>7</label><institution>Durham University</institution>, <city>Durham</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff8"><label>8</label><institution>University of Edinburgh</institution>, <city>Edinburgh</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff9"><label>9</label><institution>Dartmouth College</institution>, <city>Hanover</city>, <state>NH</state>, <country country="us">United States</country></aff>
<aff id="aff10"><label>10</label><institution>Gibran AI</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff11"><label>11</label><institution>University of Coventry</institution>, <city>Coventry</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff12"><label>12</label><institution>Technische Universit&#x00E4;t Darmstadt</institution>, <city>Darmstadt</city>, <country country="de">Germany</country></aff>
<aff id="aff13"><label>13</label><institution>University of Cambridge</institution>, <city>Cambridge</city>, <state>MA</state>, <country country="us">United States</country></aff>
<aff id="aff14"><label>14</label><institution>McGill University</institution>, <city>Montreal</city>, <state>QC</state>, <country country="ca">Canada</country></aff>
<aff id="aff15"><label>15</label><institution>Cornell University</institution>, <city>Ithaca</city>, <state>NY</state>, <country country="us">United States</country></aff>
<aff id="aff16"><label>16</label><institution>University of Utah</institution>, <city>Salt Lake City</city>, <state>UT</state>, <country country="us">United States</country></aff>
<aff id="aff17"><label>17</label><institution>University of Chicago</institution>, <city>Chicago</city>, <state>IL</state>, <country country="us">United States</country></aff>
<aff id="aff18"><label>18</label><institution>Princeton University</institution>, <city>Princeton</city>, <state>NJ</state>, <country country="us">United States</country></aff>
<aff id="aff19"><label>19</label><institution>London School of Economics</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff20"><label>20</label><institution>University of Southampton</institution>, <city>Southampton</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff21"><label>21</label><institution>Rice University</institution>, <city>Houston</city>, <state>TX</state>, <country country="us">United States</country></aff>
<aff id="aff22"><label>22</label><institution>University of Glasgow</institution>, <city>Glasgow</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff23"><label>23</label><institution>Cardiff University</institution>, <city>Cardiff</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff24"><label>24</label><institution>University of Exeter</institution>, <city>Exeter</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff25"><label>25</label><institution>University of Brighton</institution>, <city>Brighton</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff26"><label>26</label><institution>University of Illinois Urbana-Champaign</institution>, <city>Champaign</city>, <state>IL</state>, <country country="us">United States</country></aff>
<aff id="aff27"><label>27</label><institution>University College London</institution>, <city>London</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff28"><label>28</label><institution>University of Sheffield</institution>, <city>Sheffield</city>, <country country="gb">United Kingdom</country></aff>
<aff id="aff29"><label>29</label><institution>University of Edinburgh</institution>, <city>Edinburgh</city>, <country country="gb">United Kingdom</country></aff>
<author-notes><corresp id="c001"><label>&#x002A;</label>Correspondence: Cody Kommers, <email xlink:href="mailto:ckommers@turing.ac.uk">ckommers@turing.ac.uk</email></corresp></author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-26">
<day>26</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>9</volume>
<elocation-id>1753041</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>03</day>
<month>02</month>
<year>2026</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>02</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2026 Kommers, Ahnert, Antoniak, Benetos, Benford, Bunz, Caramiaux, Concannon, Disley, Dobson, Du, Du&#x00E9;&#x00F1;ez-Guzm&#x00E1;n, Francksen, Gius, Gray, Heuser, Immel, So, Leigh, Livingston, Long, Martin, Meyer, Mihai, Noel-Hirst, Ostherr, Parker, Qin, Ratcliff, Robinson, Rodriguez, Sobey, Underwood, Vashistha, Wilkens, Wu, Zheng and Hemment.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Kommers, Ahnert, Antoniak, Benetos, Benford, Bunz, Caramiaux, Concannon, Disley, Dobson, Du, Du&#x00E9;&#x00F1;ez-Guzm&#x00E1;n, Francksen, Gius, Gray, Heuser, Immel, So, Leigh, Livingston, Long, Martin, Meyer, Mihai, Noel-Hirst, Ostherr, Parker, Qin, Ratcliff, Robinson, Rodriguez, Sobey, Underwood, Vashistha, Wilkens, Wu, Zheng and Hemment</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-26">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Generative AI (GenAI) systems are increasingly recognized as cultural technologies, yet current evaluation frameworks often treat culture as a variable to be measured rather than fundamental to the system's operation. Drawing on hermeneutic theory from the humanities, we argue that GenAI systems function as "context machines" that must inherently address three interpretive challenges: situatedness (meaning only emerges in context), plurality (multiple valid interpretations coexist), and ambiguity (interpretations naturally conflict). We present computational hermeneutics as an emerging framework offering an interpretive account of what GenAI systems do, and how they might do it better. We offer three principles for hermeneutic evaluation&#x2014;that benchmarks should be iterative, not one-off; include people, not just machines; and measure cultural context, not just model output. This perspective offers a nascent paradigm for designing and evaluating contemporary AI systems: shifting from standardized questions about accuracy to contextual ones about meaning.</p>
</abstract>
<kwd-group>
<kwd>culture</kwd>
<kwd>GenAI</kwd>
<kwd>interpretation</kwd>
<kwd>meaning</kwd>
<kwd>societal impact</kwd>
</kwd-group><funding-group><funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by the Alan Turing Institute under Lloyd&#x2019;s Register Foundation grant ATI/100004. This work also supported by the Arts and Humanities Research Council UK.</funding-statement></funding-group>
<counts>
<fig-count count="0"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="117"/>
<page-count count="9"/>
<word-count count="9466"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Machine Learning and Artificial Intelligence</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Generative AI (GenAI) systems are cultural and social technologies (<xref ref-type="bibr" rid="ref4">Bender et al., 2021</xref>; <xref ref-type="bibr" rid="ref33">Farrell et al., 2025</xref>; <xref ref-type="bibr" rid="ref51">Klein et al., 2025</xref>; <xref ref-type="bibr" rid="ref96">Sorensen et al., 2024</xref>). Every aspect of these systems&#x2014;from the social data they are trained on, to the benchmarks by which they are evaluated, to the societal effects of their outputs&#x2014;depends on the complex web of norms, assumptions, meanings, practices, and social dynamics that make up culture and context. Their development is both influenced by culture (e.g., drawing on data reflecting perspectives from 21st century internet culture, while having been developed by engineers operating in a particular milieu) and in turn influences culture (e.g., shaping the kind of content people create and consume, while integrating into an ever-expanding set of production pipelines across society).</p>
<p>While this position is increasingly accepted as orthodoxy within the field of AI, it can rely on a limited definition of culture. In practice culture is often treated as a secondary consideration, like a coat of paint or dash of seasoning that modifies the more &#x201C;fundamental&#x201D; aspects of the model: for example, as a bias to debug (<xref ref-type="bibr" rid="ref9">Bolukbasi et al., 2016</xref>; <xref ref-type="bibr" rid="ref102">Tao et al., 2024</xref>), a constraint for generalizing from one context to another (<xref ref-type="bibr" rid="ref115">Yong Cao et al., 2023</xref>), a parameter in an ethical dilemma (<xref ref-type="bibr" rid="ref28">Freitas et al., 2021</xref>), or a source of variability in user preferences (<xref ref-type="bibr" rid="ref38">Ge et al., 2024</xref>). These approaches operationalize culture as a variable to be measured&#x2014;often implying that it is an optional parameter to include in model evaluation, rather than a foundational aspect of the model&#x2019;s functioning.</p>
<p>However, the most prominent frontier models&#x2014;many of which not only power popular general-purpose AI systems (e.g., ChatGPT, Gemini) but also underlie task-specific applications (e.g., Microsoft Copilot, Notion)&#x2014;are not specialized systems designed to solve targeted, well-defined tasks. They are designed, and often marketed, as general systems built to generate a variety of cultural artifacts in a vast space of possible contexts. Cultural considerations are inextricable both from how these models are developed and from the open-ended, dialogic interfaces in which they are used. It is therefore crucial that we ask: How can we most effectively evaluate GenAI as a cultural technology?</p>
<p>In this Perspective, we offer an account of culture informed by the humanities. We argue that evaluation methods in AI often overlook an important conception of culture: not as a variable to be measured, but as a dynamic, contested space where social meaning is made (<xref ref-type="bibr" rid="ref39">Geertz, 1973</xref>; <xref ref-type="bibr" rid="ref40">Hall, 1997</xref>; <xref ref-type="bibr" rid="ref51">Klein et al., 2025</xref>). This way of looking at culture challenges a core assumption in standard practices for AI benchmarking&#x2014;that model performance is best understood through universal, standardized tasks with convergent solutions or goals (<xref ref-type="bibr" rid="ref82">Raji et al., 2021</xref>). While this approach works for well-defined tasks where &#x201C;success&#x201D; can be codified into a single, unique interpretation, culture is not this kind of task.</p>
<p>To illustrate the challenge of evaluating cultural outputs, consider the act of writing a letter, painting a portrait, composing a song, cooking a meal, penning a journal entry, or even talking with a friend. While it is possible to assign a quantitative score to these outputs to describe how well the task was performed, that approach can miss the point of these activities in crucial ways. For example, reducing cultural activities to a set of proxy variables can trivialize them (<xref ref-type="bibr" rid="ref117">Zhou et al., 2025</xref>), while scalable &#x201C;thin&#x201D; metrics are often insufficient to capture key aspects of what makes them meaningful (<xref ref-type="bibr" rid="ref55">Kommers et al., 2025b</xref>). The structure of these tasks is such that the primary question is not about assessing how closely they cleave to a canonical ground truth. Rather it is about arbitrating among multiple, possibly conflicting, interpretations of their meaning within a specific frame of reference. This requires us to think about culture as an intrinsically different kind of &#x201C;task&#x201D; from those by which a model&#x2019;s performance has traditionally been judged.</p>
<p>Our position is that, as AI systems are increasingly deployed to (co-)produce cultural outputs, it is imperative that our methods of evaluation reflect the interpretive dimensions needed to characterize them more fully. To address this, we introduce hermeneutics&#x2014;a core tradition in the humanities concerned with the theory and practice of interpretation&#x2014;as a theoretical foundation for understanding and evaluating GenAI systems (<xref ref-type="bibr" rid="ref72">Mohr et al., 2015</xref>; <xref ref-type="bibr" rid="ref85">Rebera et al., 2025</xref>; <xref ref-type="bibr" rid="ref90">Romele et al., 2020</xref>). Having grappled with these questions for decades, if not centuries, the conceptual infrastructure of the humanities (via hermeneutics) can help articulate the grounds on which a given interpretation can be considered legitimate. Providing such an account of the interpretive nature of GenAI systems is a crucial step toward improving the way we design and evaluate them.</p>
<p>Thus, we present computational hermeneutics as an emerging framework offering an interpretive approach to the evaluation of GenAI systems. We argue that GenAI can, and should, be understood as &#x201C;doing&#x201D; interpretation in ways that reflect the entanglement of culture in their input, processes, and outputs. We use this active phrasing&#x2014;to &#x201C;do&#x201D; interpretation&#x2014;to reflect the fact that interpretive considerations are inextricably bound up in the processes and structures underlying these systems. The data, architecture, and algorithms of these systems are not static mirrors reflecting back invariant, disinterested projections of the world. They must be understood as comprising interpretive stakes, decisions, and processes. On the other hand, it is nonetheless crucial to recognize that GenAI do not &#x201C;do&#x201D; interpretation in the same way as humans and to avoid unduly imbuing them with anthropomorphic intentions (<xref ref-type="bibr" rid="ref22">DeVrio et al., 2025</xref>; <xref ref-type="bibr" rid="ref1">Akbulut et al., 2024</xref>).</p>
<p>With this in mind, we offer three hermeneutic challenges that are inherent to such interpretive processes: situatedness, plurality, and ambiguity. Each of these already exists in one form or another in contemporary AI (<xref ref-type="bibr" rid="ref12">Akbulut et al., 2025</xref>; <xref ref-type="bibr" rid="ref57">Lazar and Nelson, 2023</xref>; <xref ref-type="bibr" rid="ref96">Sorensen et al., 2024</xref>). We further this existing work by suggesting how these challenges can be brought together within a hermeneutic frame. Finally, we offer three principles for developing hermeneutic methods of evaluating GenAI: that benchmarks should be iterative, not one-off; include people, not just machines; and measure cultural context, not just model output.</p>
</sec>
<sec id="sec2">
<label>2</label>
<title>Computational hermeneutics</title>
<p>Interpretation is the methodological bedrock of the humanities (<xref ref-type="bibr" rid="ref39">Geertz, 1973</xref>). Generally speaking, what humanists do when studying cultural artifacts&#x2014;whether a novel, historical event, or painting&#x2014;is to construct an interpretation: an analysis of that artifact&#x2019;s meaning within its social or historical context. But this approach comes with an inherent challenge. How do we know whether a given interpretation is a good one? Hermeneutics is the method, justification, or separate interpretive process which gives credence or legitimacy to the original interpretation (<xref ref-type="bibr" rid="ref13">Caputo, 2018</xref>; <xref ref-type="bibr" rid="ref88">Ricoeur, 1981</xref>). This concept is foundational across many disciplines and practices, from legal and literary studies (<xref ref-type="bibr" rid="ref59">Levinson and Mailloux, 1988</xref>; <xref ref-type="bibr" rid="ref100">Szondi, 1995</xref>) to debates in philosophy and aesthetics (<xref ref-type="bibr" rid="ref91">Rosen, 2003</xref>; <xref ref-type="bibr" rid="ref95">Simpson, 2020</xref>). It arises, in one form or another, whenever scholars confront epistemological problems of meaning.</p>
<p>A core concept within this tradition is the &#x201C;hermeneutic circle&#x201D; (<xref ref-type="bibr" rid="ref23">Dilthey, 1989</xref>; <xref ref-type="bibr" rid="ref36">Gadamer, 1960</xref>; <xref ref-type="bibr" rid="ref42">Heidegger, 1927</xref>; <xref ref-type="bibr" rid="ref93">Schleiermacher, 1998</xref>). This describes the interpretation of an artifact as an iterative process between understanding the meaning of a specific part of the artifact and the meaning of the artifact as a whole. For example, one could iteratively analyze the imagery depicted in a given line or stanza of a poem, then update one&#x2019;s conception about what the poem means in general&#x2014;each time using the updated general theory to analyze the specific line, and vice versa. While the term is varied in its usage, what it typically means to analyze something hermeneutically is to engage in (and provide an account of) this iterative process of interpretation.</p>
<p>As applied to contemporary AI, we offer a notion of computational hermeneutics in two senses. The first sense is that AI models are fundamentally interpretive in a way that makes hermeneutic problems unavoidable; these challenges are intrinsic to GenAI&#x2019;s flexible production of sophisticated cultural artifacts such as texts and images. To categorize their outputs as binary &#x201C;right&#x201D; or &#x201C;wrong&#x201D; responses presents a similar profile of problems as asking whether <italic>Anna Karenina</italic> is a superior novel to <italic>Jane Eyre</italic>, whether the spiritual life prescribed in Laozi&#x2019;s <italic>Tao Te Ching</italic> is the right one, or whether Andy Warhol&#x2019;s soup can paintings were a critique, rather than a celebration, of American consumerism. Judgments on these matters are possible, but they depend crucially on the underlying assumptions of one&#x2019;s interpretive processes.</p>
<p>The second sense is that interpretive evaluation requires us to look at both specific and general aspects of the models, in the tradition of the hermeneutic circle. These models have both a general architecture (e.g., pre-training, vector representations, fine-tuning), as well as specific dialogic interactions with human users (e.g., context windows, prompts). We must look at both the system-level and context-specific generalizations in interpreting the outputs of these models. Roughly speaking, partial analysis maps onto the &#x201C;Chat&#x201D; in ChatGPT, while holistic analysis maps onto the &#x201C;GPT.&#x201D; Though these separate parts are interrelated, it is crucial to draw distinctions required for the evaluation of each on their own terms (<xref ref-type="bibr" rid="ref24">Dobson, 2019</xref>; <xref ref-type="bibr" rid="ref89">Ringler, 2024</xref>).</p>
<sec id="sec3">
<label>2.1</label>
<title>Hermeneutic challenges for AI</title>
<p>With this framing in mind, we present three hermeneutic challenges for GenAI: situatedness, plurality, and ambiguity. Each of these challenges take aspects of a model that may seem arbitrary, peripheral, or in need of optimization&#x2014;and re-centers those apparently accidental features as significant choices worthy of theoretical reflection. We take addressing these challenges to be the main difference between accounting for culture as a variable versus culture as a site of social meaning-making.</p>
<sec id="sec4">
<label>2.1.1</label>
<title>Situatedness: meaning only emerges in context</title>
<p>A core principle across many (if not all) of the humanities is that context is key. What this expresses, typically, is that to interpret the meaning of a cultural artifact, one must look at the historical or social context in which it has been made, used, or perceived (<xref ref-type="bibr" rid="ref36">Gadamer, 1960</xref>). For example, a contemporary reader of <italic>Huckleberry Finn</italic> will inevitably have a different relation to the text from a reader in the 19th century America of the book&#x2019;s original publication. When the frame of reference shifts, so does the meaning. Cultural products are always generated within the bounds of a particular historical, cultural, or communicative context. This is the &#x201C;situatedness&#x201D; of meaning: an interpretation always takes a particular point of view, even if that perspective is only stated implicitly.</p>
<p>It can be easy to overlook this in contemporary AI interfaces, which often present the model as speaking from a god&#x2019;s eye point of view&#x2014;that of the disembodied model which has seen, read, and synthesized more information than any one human ever could (<xref ref-type="bibr" rid="ref43">Hemment et al., 2025</xref>). No such epistemically totalitarian &#x201C;view from nowhere&#x201D; exists in any legitimate sense (<xref ref-type="bibr" rid="ref41">Haraway, 1988</xref>). Within a hermeneutic frame, the point is not to build and evaluate models that aim to achieve this universal, monolithic perspective. Rather it is for the specific perspective being offered to be clearly identified and understood as just that: a specific perspective. For example, recent work has empirically demonstrated how GenAI systems can collapse perspectives into an idealized form, showing how further mechanisms are needed to maintain the individuation of distinct perspectives (<xref ref-type="bibr" rid="ref45">Heuser, 2025</xref>).</p>
</sec>
<sec id="sec5">
<label>2.1.2</label>
<title>Plurality: one person&#x2019;s bias is another person&#x2019;s values</title>
<p>Interpretation is inherently plural, because different communities rely on distinct frameworks for making sense of the world. What appears as meaningful artistic expression to one group may seem inappropriate or offensive to another; what counts as authoritative fact in one tradition may be dismissed as unsubstantiated assertion in another. As is widely held in the humanities, multiple valid interpretations can coexist without requiring resolution into a single &#x201C;correct&#x201D; reading. Any AI model intended for use in different cultural contexts must grapple with the observation that what looks like arbitrary cultural bias from one perspective is often the same thing that gives a sense of meaning and value in another.</p>
<p>AI systems face this challenge directly because they serve users with distinct values while being trained on materials whose authors often disagree. Generative models are therefore both one and many: reflecting specific curatorial decisions, but also containing contradictory voices (<xref ref-type="bibr" rid="ref21">Desai et al., 2024</xref>; <xref ref-type="bibr" rid="ref94">Sharma et al., 2024</xref>; <xref ref-type="bibr" rid="ref110">Veselovsky et al., 2025b</xref>). Recent work on pluralistic, thick, or full-stack alignment recognizes that human values naturally conflict and advocates for systems that can accommodate this diversity (<xref ref-type="bibr" rid="ref57">Lazar and Nelson, 2023</xref>; <xref ref-type="bibr" rid="ref63">Lowe et al., 2025</xref>; <xref ref-type="bibr" rid="ref96">Sorensen et al., 2024</xref>). However, while pluralistic alignment focuses on adjusting model behavior to reflect different values, the deeper challenge lies in how we evaluate such systems. Standard evaluation frameworks assume convergent solutions&#x2014;that there is a standard candle against which model performance can be definitively compared. Cultural tasks, by contrast, do not converge to single solutions: success cannot be determined by proximity to a ground truth but must account for the legitimacy of multiple interpretations within their respective contexts. This requires fundamentally rethinking evaluation from measuring accuracy to assessing appropriateness across different cultural frameworks (<xref ref-type="bibr" rid="ref58">Leibo et al., 2024</xref>). For example, what is viewed as AI &#x201C;slop&#x201D; in one context may be valued as a legitimate source of meaning or seen as having aesthetic resonance in another (<xref ref-type="bibr" rid="ref54">Kommers et al., 2025a</xref>).</p>
</sec>
<sec id="sec6">
<label>2.1.3</label>
<title>Ambiguity: interpretations naturally conflict</title>
<p>In hermeneutics, meaning is not something that exists as a fixed property of a text or cultural artifact, inertly awaiting discovery. Rather, meaning emerges through what Gadamer calls the &#x201C;fusion of horizons&#x201D;&#x2014;the dynamic interaction between the interpreter&#x2019;s background and the artifact being interpreted (<xref ref-type="bibr" rid="ref36">Gadamer, 1960</xref>). This process is intrinsically ambiguous. The space of possible mappings between potentially relevant features of the interpreter&#x2019;s background and the artifact is combinatorially large, and therefore a definitive interpretation is not computationally tractable. To offer a particular kind of interpretation (e.g., feminist, post-colonial, techno-optimist) is to ease this intractability by specifying an <italic>a priori</italic> constraint on which features to consider. More generally, Gadamer emphasizes the role of &#x201C;play&#x201D; in interpretation&#x2014;that creative, open-ended consideration of tensions between different meanings offers a way of exploring this space of interpretive possibilities. It is therefore crucial that ambiguity be maintained in articulating this interpretive space, rather than being flattened into a specific mode of interpretation.</p>
<p>Ambiguity has long been of interest in AI, often with the goal of resolving it (<xref ref-type="bibr" rid="ref74">Navigli, 2009</xref>). Semantic disambiguation tasks, for instance, aim to determine which meaning of a polysemous word is intended in a given context&#x2014;clarifying whether &#x201C;light&#x201D; is used to signify illumination or weight. Such tasks are crucial for many applications, but they represent only one way of engaging with ambiguity. When AI systems generate cultural outputs&#x2014;whether composing poetry, engaging in dialog, or creating visual art&#x2014;the goal is not necessarily to eliminate semantic uncertainty but to work productively within it (<xref ref-type="bibr" rid="ref37">Gaver et al., 2003</xref>). A poem that resolves all its ambiguities loses much of its interpretive richness; a conversation that admits only one reading of each utterance becomes sterile (<xref ref-type="bibr" rid="ref29">Empson, 1930</xref>). However, current evaluation frameworks often treat this ambiguity as noise to be minimized rather than a generative resource (<xref ref-type="bibr" rid="ref113">Yadav et al., 2021</xref>). While semantic disambiguation tasks can be useful, elimination of ambiguity is not the only&#x2014;or even the primary&#x2014;goal when it comes to cultural outputs. Instead, evaluation should assess how well systems navigate ambiguity productively, maintaining the interpretive flexibility that enables meaningful cultural engagement across diverse contexts (<xref ref-type="bibr" rid="ref58">Leibo et al., 2024</xref>; <xref ref-type="bibr" rid="ref109">Veselovsky et al., 2025a</xref>). For example, recent approaches have sought to tease out the inherently multiplicitous perspectives contained within GenAI systems, developing processes for negotiating among conflicting viewpoints held within the model architecture (<xref ref-type="bibr" rid="ref60">Li et al., 2024</xref>).</p>
</sec>
</sec>
</sec>
<sec id="sec7">
<label>3</label>
<title>Generative AI systems as &#x201C;context machines&#x201D;</title>
<p>In this section, we argue that GenAI systems &#x201C;do&#x201D; interpretation as a fundamental capacity (<xref ref-type="bibr" rid="ref25">Dobson, 2022</xref>)&#x2014;and therefore evaluation of their performance is subject to the three hermeneutic challenges described above. Even so, it is important to note that the interpretive processes underlying these systems are distinct from those of human interpreters (<xref ref-type="bibr" rid="ref81">Placani, 2024</xref>); while conversational systems may superficially adopt the voice of a human perspective, they should not be mistaken as inveterately human (<xref ref-type="bibr" rid="ref80">Peter et al., 2025</xref>). For instance, such interpretive processes take place both internally within a model, as well as dialogically in their interactions with people. Providing a more comprehensive account of the interpretive nature of these systems is a crucial step toward improving the way we design and evaluate them.</p>
<p>We posit that GenAI systems can be broadly understood as &#x201C;context machines.&#x201D; At core, GenAI systems are designed to answer the question: given the current context, what is the next relevant token, pixel, or other value? This ability to consolidate a broader set of contextual cues into a unified representation is supported by a variety of architectural features&#x2014;but most notably by vector space embeddings (<xref ref-type="bibr" rid="ref31">Ethayarajh, 2019</xref>; <xref ref-type="bibr" rid="ref56">Kozlowski et al., 2019</xref>; <xref ref-type="bibr" rid="ref99">Stoltz and Taylor, 2021</xref>). Such embeddings are a means of encoding highly sophisticated co-occurrence statistics (<xref ref-type="bibr" rid="ref105">Turney and Pantel, 2010</xref>). In language models, they are learned by poring over vast corpora of text (<xref ref-type="bibr" rid="ref70">Mikolov et al., 2013</xref>; <xref ref-type="bibr" rid="ref79">Pennington et al., 2014</xref>). In vision models, vectors of pixel values are often encoded as feature maps capturing edges, textures, and semantic patterns (<xref ref-type="bibr" rid="ref5">Bengio et al., 2012</xref>; <xref ref-type="bibr" rid="ref68">Mihai and Hare, 2021</xref>). Decoding these embeddings is also an interpretive act. This process is often probabilistic, accommodating a plurality of possible interpretations (<xref ref-type="bibr" rid="ref48">James et al., 2013</xref>; <xref ref-type="bibr" rid="ref114">Yang et al., 2023</xref>). Informally, these vectors are designed to capture the &#x201C;meaning&#x201D; of words or images; more concretely, they are a highly nuanced way of describing the context in which a word is likely to occur.</p>
<p>Generative models work as well as they do because (as is a common refrain in the humanities) context matters&#x2014;so much so that if you get it right, a lot of other important things follow. Vector space embeddings are therefore subject to a similar question as humanistic inquiry: How do we know whether a given interpretation, as encoded by an embedding, is a good one? Accordingly, GenAI systems are faced with the three hermeneutic challenges described above: the outputs of these systems are situated (the &#x201C;meaning&#x201D; of one token is defined relationally within the context of other tokens); plural (there are multiple legitimate interpretations of what counts as the next most likely token); and ambiguous (the probabilistic decoding process maintains rather than resolves semantic uncertainty).</p>
<p>Our position is that Generative AI systems both &#x201C;do&#x201D; interpretation, and that they can do it better. For example, the self-attention mechanism of the transformer architecture can be read as a way of relating partial and holistic interpretations (<xref ref-type="bibr" rid="ref108">Vaswani et al., 2017</xref>). It allows the model to iteratively update its understanding of individual tokens based on their relationship to the broader sequence, and vice versa&#x2014;in other words, the hermeneutic circle in action.</p>
<sec id="sec8">
<label>3.1</label>
<title>AI systems do not just &#x201C;read in&#x201D; context; they help create it</title>
<p>Interpretation does not only occur in isolation within GenAI models; these systems also co-construct interpretations in collaboration with humans (<xref ref-type="bibr" rid="ref34">Frauenberger, 2019</xref>). A hermeneutic perspective on AI is not just about building systems that can interpret like humans, as a substitute or proxy for human expertise. Rather it is about recognizing how interpretation itself emerges through interaction between humans and machines. In this view, interpretive capacity arises not only within the model but through the design of interactions and interfaces that frame it.</p>
<p>The effects of this collaboration are bidirectional. From human to machine, people decide what data the systems are trained on (<xref ref-type="bibr" rid="ref21">Desai et al., 2024</xref>); formulate objective functions that reflect a specific set of goals, values, and assumptions (<xref ref-type="bibr" rid="ref57">Lazar and Nelson, 2023</xref>); fine-tune system behavior through mechanisms like reinforcement learning from human feedback (<xref ref-type="bibr" rid="ref78">Ouyang et al., 2022</xref>); and &#x201C;engineer&#x201D; prompts in order to elicit certain kinds of responses (<xref ref-type="bibr" rid="ref17">Chen et al., 2025</xref>). At multiple layers of the system, human annotators&#x2014;who can themselves offer conflicting interpretations (<xref ref-type="bibr" rid="ref35">Frenda et al., 2024</xref>)&#x2014;can provide feedback on ambiguous cases, rank responses, or supply preference scores, effectively staging a dialog where the AI&#x2019;s provisional interpretations can be contested and refined.</p>
<p>From machine to human, AI systems affect important mental capacities like metacognition (<xref ref-type="bibr" rid="ref101">Tankelevitch et al., 2024</xref>); elicit different assumptions about relational norms [e.g., AI as assistant vs. therapist (<xref ref-type="bibr" rid="ref27">Earp et al., 2025</xref>)]; act as thought-partners, for example by summarizing documents people would otherwise have to read&#x2014;or skim&#x2014;in full (<xref ref-type="bibr" rid="ref19">Collins et al., 2024</xref>); shape human responses by explaining their own decisions (<xref ref-type="bibr" rid="ref26">Doshi-Velez and Kim, 2017</xref>); and enable novel kinds of experience, such as certain creative practices (<xref ref-type="bibr" rid="ref14">Caramiaux and Fdili Alaoui, 2022</xref>; <xref ref-type="bibr" rid="ref44">Hemment et al., 2024</xref>; <xref ref-type="bibr" rid="ref73">Murray-Browne and Tigas, 2021</xref>). Examples of how this approach has been employed include applications of assemblage thinking to study how AI is deployed (<xref ref-type="bibr" rid="ref104">Tseng, 2023</xref>), as well as design frameworks that incorporate interpretive practices into multiple steps of the development process (<xref ref-type="bibr" rid="ref2">Andres et al., 2025</xref>). Together, humans and GenAI systems form an interpretive feedback loop. Far from a separate isolated entity that the system merely &#x201C;reads in,&#x201D; AI systems can exert a direct influence on the cultural context in which they operate.</p>
</sec>
</sec>
<sec id="sec9">
<label>4</label>
<title>Operationalizing hermeneutics in AI</title>
<p>Typically, AI benchmarking assumes universal, standardized tasks with convergent solutions (<xref ref-type="bibr" rid="ref16">Chang et al., 2024</xref>; <xref ref-type="bibr" rid="ref30">Eriksson et al., 2025</xref>; <xref ref-type="bibr" rid="ref82">Raji et al., 2021</xref>)&#x2014;an approach fundamentally at odds with a hermeneutic perspective on culture. While benchmarks are key drivers of progress in AI, they often do not offer especially strong standards for what they purport to measure (<xref ref-type="bibr" rid="ref50">Kapoor et al., 2024</xref>; <xref ref-type="bibr" rid="ref66">McIntosh et al., 2025</xref>; <xref ref-type="bibr" rid="ref87">Reuel-Lamparth et al., 2024</xref>; <xref ref-type="bibr" rid="ref92">Schlangen, 2021</xref>). Furthermore, the implicit goal of benchmarking is often not to develop stronger metrics for specialized cases (though see <xref ref-type="bibr" rid="ref18">Chiu et al. (2024)</xref> and <xref ref-type="bibr" rid="ref106">Underwood et al. (2025)</xref>) but something more like one-task-suite-to-rule-them-all, a comprehensive assessment that would give an unequivocal, decisive answer to the question of which model is better at what <xref ref-type="bibr" rid="ref76">Norah Alzahrani et al. (2024)</xref>, <xref ref-type="bibr" rid="ref32">Ethayarajh and Jurafsky (2020)</xref>, <xref ref-type="bibr" rid="ref52">Koch and Peterson (2024)</xref>, <xref ref-type="bibr" rid="ref82">Raji et al. (2021)</xref>, and <xref ref-type="bibr" rid="ref97">Srivastava et al. (2023)</xref>.</p>
<p>Our hermeneutic framing challenges this paradigm by reimagining the kinds of questions that can be asked with AI benchmarks: shifting from standardized questions about accuracy to contextual ones about meaning. From this perspective, no such comprehensive task suite can be developed, because the &#x201C;task&#x201D; of creating cultural outputs means too many different things in too many different contexts. Attempts to standardize cultural production into a comprehensive assessment often seek to scrub away this context; we advocate that such context must be embraced. We offer three ways of making AI benchmarks that better reflect a hermeneutic lens on culture&#x2014;by making them iterative, not just one-off; including people, not just machines; and measuring cultural context, not just model output.</p>
<sec id="sec10">
<label>4.1</label>
<title>Benchmarks should be iterative, not just one-off</title>
<p>The hermeneutic circle suggests that interpretation depends on an iterative process between part and whole. By contrast, benchmarks typically apply a score&#x2014;often scalar values such as accuracy, precision, recall, F1, or BLEU scores (<xref ref-type="bibr" rid="ref16">Chang et al., 2024</xref>; <xref ref-type="bibr" rid="ref30">Eriksson et al., 2025</xref>)&#x2014;to quantify the model&#x2019;s performance in a given domain. Hermeneutics benchmarking suggests two modifications that can be made to this approach.</p>
<p>First, evaluation is both limited and unreliable when it scores performance based on a single prompt (<xref ref-type="bibr" rid="ref71">Mizrahi et al., 2024</xref>). By contrast, cultural outputs are always part of an evolving conversation, whether a literal dialog or as a part of a broader evolutionary process (<xref ref-type="bibr" rid="ref10">Brinkmann et al., 2023</xref>). Evaluation should accordingly be iterative, unfolding over multiple prompts or exchanges that reflect the evolving interpretive context.</p>
<p>Second, evaluation must take into account both the model as whole and the specific dialogic frame in which a given output is elicited. For example, the focus of benchmarking on aggregate metrics indicating average performance rather than instance-by-instance evaluations limits generalizability (<xref ref-type="bibr" rid="ref11">Burnell et al., 2023</xref>). Overall, hermeneutic evaluations should seek to iteratively assess both the model&#x2019;s holistic capabilities, as well as its behavior in specific circumstances.</p>
<p>Existing benchmarks have begun to incorporate multi-turn iterative processes into their evaluation practices. Notable examples include assessments of chatbot capabilities in more than a dozen distinct tasks which evaluate performance over the course of an interaction with a human interlocutor (<xref ref-type="bibr" rid="ref3">Bai et al., 2024</xref>), as well as assessments of perceived anthropomorphism in language models which show that the interpretation of model behavior as social (e.g., &#x201C;relationship building&#x201D; via empathic, emotionally-validating responses) only take place after multiple turns of interaction (<xref ref-type="bibr" rid="ref46">Ibrahim et al., 2025a</xref>).</p>
</sec>
<sec id="sec11">
<label>4.2</label>
<title>Benchmarks should include people, not just machines</title>
<p>The interpretive processes underlying GenAI are inextricably bound up in collaboration with the people using them (<xref ref-type="bibr" rid="ref67">Messeri and Crockett, 2024</xref>). Benchmarks should therefore not just consider AI performance in isolation but ought to also measure the effects of different interactive configurations. For example, current approaches to the assessment of creativity in narrative generation range from automated metrics to expert human judgment (<xref ref-type="bibr" rid="ref8">Boisson et al., 2025</xref>; <xref ref-type="bibr" rid="ref15">Chakrabarty et al., 2024</xref>; <xref ref-type="bibr" rid="ref65">Marco et al., 2025</xref>); but these often treat creativity as a model property rather than a relational phenomenon.</p>
<p>A hermeneutic approach would evaluate how human-AI collaboration produces interpretations, examining not just outputs but the interpretive dialog that generates them. This builds on a wide range of efforts in AI evaluation which increasingly recognize that benchmarks cannot be divorced from their communicative context (<xref ref-type="bibr" rid="ref18">Chiu et al., 2024</xref>; <xref ref-type="bibr" rid="ref20">Denton et al., 2020</xref>; <xref ref-type="bibr" rid="ref111">Weidinger et al., 2024</xref>; <xref ref-type="bibr" rid="ref112">Weidinger et al., 2023</xref>). Overall, hermeneutic evaluation requires benchmarks that assess interactivity rather than isolated performance, examining not just outputs but the interpretive dialog that generates them.</p>
<p>This practice is increasingly adopted in AI benchmarking. For example, assessments of harms from GenAI systems are sensitive to a larger range of potential issues&#x2014;such as social manipulation or cognitive overreliance&#x2014;only by evaluating the model capabilities in conjunction with their use by a human (<xref ref-type="bibr" rid="ref47">Ibrahim et al., 2025b</xref>). Likewise, a recent benchmark looking at cultural expectation incorporates over 10,000 human annotations, reflecting norms and judgments based on the lived experience of people from a given cultural domain (<xref ref-type="bibr" rid="ref75">Nayak et al., 2025</xref>).</p>
</sec>
<sec id="sec12">
<label>4.3</label>
<title>Benchmarks should measure cultural context, not just model output</title>
<p>Individual interpretations of meaning depend on cultural context (<xref ref-type="bibr" rid="ref53">Kommers and DeDeo, 2025</xref>)&#x2014;yet standard evaluation practices treat context as secondary to model performance metrics. Thin signals of like/dislike, positive/negative, or use/disuse cannot provide this contextual grounding (<xref ref-type="bibr" rid="ref55">Kommers et al., 2025b</xref>). Rather, we need hermeneutic approaches for putting contextual use cases on equal footing with general model capacities.</p>
<p>Partially, this is simply a suggestion to evaluate AI in the context in which it will be used (<xref ref-type="bibr" rid="ref12">Akbulut et al., 2025</xref>; <xref ref-type="bibr" rid="ref62">Liao and Xiao, 2023</xref>; <xref ref-type="bibr" rid="ref64">Malaviya et al., 2025</xref>; <xref ref-type="bibr" rid="ref67">Messeri and Crockett, 2024</xref>; <xref ref-type="bibr" rid="ref103">Tomaszewska and Biecek, 2024</xref>). For example, frameworks like HELM recognize the need for contextually dependent approaches beyond accuracy (<xref ref-type="bibr" rid="ref61">Liang et al., 2023</xref>). This can help address issues with current benchmarks, such as failure to capture real-world utility (<xref ref-type="bibr" rid="ref77">Ott et al., 2022</xref>), or by adapting general processes to better fit situational needs (<xref ref-type="bibr" rid="ref98">Staufer et al., 2025</xref>).</p>
<p>But more pointedly, digging deeper into contextualized scenarios allows us to probe different aspects of the model. Rather than asking whether a response is correct, hermeneutic evaluation can assess how and why a response achieves appropriateness within its specific cultural framework (<xref ref-type="bibr" rid="ref6">Bhutani et al., 2024</xref>; <xref ref-type="bibr" rid="ref58">Leibo et al., 2024</xref>). Evaluation must treat cultural context not as a constraint on model performance, but as the medium through which such performance emerges.</p>
<p>Some benchmarks are beginning to incorporate these kinds of contextual markers. For instance, a recent benchmark contrasts socio-cultural norms for Chinese vs. American viewers of AI-generated videos (<xref ref-type="bibr" rid="ref107">Varimalla et al., 2025</xref>). Similarly, a recent dataset organizes feedback from human raters based on demographic information, allowing for distinction in cultural judgments (<xref ref-type="bibr" rid="ref83">Rastogi et al., 2026</xref>). In summary, it is worth noting that the strongest of exemplars of hermeneutic evaluation tend to adopt all three recommendations: they are iterative, incorporate human participants, and sensitive to sociocultural variation.</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec13">
<label>5</label>
<title>Discussion</title>
<p>Computational hermeneutics represents a potential shift in how we conceptualize GenAI systems. Rather than treating culture as a variable to be controlled or optimized away, we propose recognizing it as a foundational aspect of how these systems operate. This reframing transforms GenAI from answer-generating machines into interpretive partners&#x2014;systems designed to engage with the situatedness, plurality, and ambiguity that characterize individual and collective human meaning-making.</p>
<p>In this article, we have focused on the evaluation of GenAI systems via benchmarks. We offer this as a potentially effective means by which scholars with a humanistic background can help shape the direction of technical development in AI. Benchmarks are an important part of how the field of AI progresses and understands its own progress. However, in practice benchmarks often fall short of meaningfully assessing what they purport to measure (<xref ref-type="bibr" rid="ref50">Kapoor et al., 2024</xref>; <xref ref-type="bibr" rid="ref66">McIntosh et al., 2025</xref>; <xref ref-type="bibr" rid="ref87">Reuel-Lamparth et al., 2024</xref>; <xref ref-type="bibr" rid="ref92">Schlangen, 2021</xref>), and it is widely acknowledged that better benchmarks are needed to support ethical and effective development of AI (<xref ref-type="bibr" rid="ref7">Blagec et al., 2023</xref>; <xref ref-type="bibr" rid="ref86">Ren et al., 2024</xref>; <xref ref-type="bibr" rid="ref116">Zhao et al., 2025</xref>). One possible systemic cause of this is proxy failure (<xref ref-type="bibr" rid="ref49">John et al., 2024</xref>): that the field&#x2019;s monocultural overreliance on standardized performance metrics is inadequate to capture the kinds of things we really want AI to do (<xref ref-type="bibr" rid="ref52">Koch and Peterson, 2024</xref>; <xref ref-type="bibr" rid="ref55">Kommers et al., 2025b</xref>; <xref ref-type="bibr" rid="ref117">Zhou et al., 2025</xref>). This gives researchers with expertise in operationalizing tricky social or cultural concepts a useful lever for influencing this technology&#x2019;s metrics for success. But while we have focused on evaluation, this is not the only way to employ a hermeneutic perspective in AI. For example, on-going debates look at the cultural and social underpinnings of a model&#x2019;s training data (<xref ref-type="bibr" rid="ref69">Mihalcea et al., 2025</xref>; <xref ref-type="bibr" rid="ref84">Ravichander et al., 2025</xref>).</p>
<p>More generally, the hermeneutic tradition points to how powerful technological systems cannot be considered only in isolation, without appreciation of their environmental and societal consequences; this is a juncture at which crucial debates are being held and to which we hope a hermeneutic perspective can contribute. We offer the emerging framework of computational hermeneutics as a potential means of rethinking how we evaluate AI from the ground up&#x2014;as a set of technologies that does not just participate in culture by accident, but as systems which fundamentally shape, and are shaped by, cultural meaning.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="sec14">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding author/s.</p>
</sec>
<sec sec-type="author-contributions" id="sec15">
<title>Author contributions</title>
<p>CK: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. RA: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. MA: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. EB: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. SB: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. MB: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. BC: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. SC: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. MD: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. JD: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. YD: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. ED-G: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. KF: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. EG: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. JG: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. RH: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. SI: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. RS: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. SL: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. DL: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. HL: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. MM: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. GM: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. DM: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. AN-H: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. KO: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. DP: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. YQ: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. JR: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. ER: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. KR: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. AS: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. TU: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. AV: Writing &#x2013; review &#x0026; editing, Writing &#x2013; original draft. MW: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. YW: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. YZ: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing. DH: Writing &#x2013; original draft, Writing &#x2013; review &#x0026; editing.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors wish to thank the reviewers who helped us present this material as clearly and effective as possible with their feedback.</p>
</ack>
<sec sec-type="COI-statement" id="sec17">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The author YW declared that they were an editorial board member of Frontiers, at the time of submission. This had no impact on the peer review process and the final decision.</p>
</sec>
<sec sec-type="ai-statement" id="sec18">
<title>Generative AI statement</title>
<p>The author(s) declared that Generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="sec19">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Akbulut</surname><given-names>C.</given-names></name> <name><surname>Weidinger</surname><given-names>L.</given-names></name> <name><surname>Manzini</surname><given-names>A.</given-names></name> <name><surname>Gabriel</surname><given-names>I.</given-names></name> <name><surname>Rieser</surname><given-names>V.</given-names></name></person-group> (<year>2024</year>). <article-title>All too human? Mapping and mitigating the risk from anthropomorphic AI</article-title>. In <source>Proceedings of the AAAI/ACM conference on AI, ethics, and society</source> (Vol. <volume>7</volume>. pp. <fpage>13</fpage>&#x2013;<lpage>26</lpage>).</mixed-citation></ref>
<ref id="ref12"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Akbulut</surname><given-names>M.</given-names></name> <name><surname>Kevin Robinson</surname><given-names>K.</given-names></name> <name><surname>Maribeth Rauh</surname><given-names>M.</given-names></name> <name><surname>Isabela Albuquerque</surname><given-names>I.</given-names></name> <name><surname>Olivia Wiles</surname><given-names>O.</given-names></name> <name><surname>Laura Weidinger</surname><given-names>L.</given-names></name> <etal/></person-group>. (<year>2025</year>). &#x201C;<article-title>Century: A framework and dataset for evaluating historical contextualisation of sensitive images</article-title>&#x201D; in <source>The thirteenth international conference on learning representations</source>.</mixed-citation></ref>
<ref id="ref2"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Andres</surname><given-names>J.</given-names></name> <name><surname>Danta</surname><given-names>C.</given-names></name> <name><surname>Bianchi</surname><given-names>A.</given-names></name> <name><surname>Farzanfar</surname><given-names>S.</given-names></name> <name><surname>Milena Fernandez-Nieto</surname><given-names>G.</given-names></name> <name><surname>Becker</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2025</year>). &#x201C;<article-title>A scenario-based design pack for exploring multimodal human&#x2013;GenAI relations</article-title>&#x201D; in <source>Proceedings of the 27th international conference on multimodal interaction</source>, <fpage>145</fpage>&#x2013;<lpage>154</lpage>.</mixed-citation></ref>
<ref id="ref3"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bai</surname><given-names>G.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Bu</surname><given-names>X.</given-names></name> <name><surname>He</surname><given-names>Y.</given-names></name> <name><surname>Liu</surname><given-names>J.</given-names></name> <name><surname>Zhou</surname><given-names>Z.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Mt-bench-101: a fine-grained benchmark for evaluating large language models in multi-turn dialogues</article-title>. <source>arXiv preprint arXiv:2402.14762.</source></mixed-citation></ref>
<ref id="ref4"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Bender</surname><given-names>E. M.</given-names></name> <name><surname>Gebru</surname><given-names>T.</given-names></name> <name><surname>McMillan-Major</surname><given-names>A.</given-names></name> <name><surname>Shmitchell</surname><given-names>S.</given-names></name></person-group> (<year>2021</year>). &#x201C;<article-title>On the dangers of stochastic parrots: can language models be too big?</article-title>&#x201D; in <source>Proceedings of the 2021 ACM conference on fairness, accountability, and transparency</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>610</fpage>&#x2013;<lpage>623</lpage>.</mixed-citation></ref>
<ref id="ref5"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bengio</surname><given-names>Y.</given-names></name> <name><surname>Courville</surname><given-names>A. C.</given-names></name> <name><surname>Vincent</surname><given-names>P.</given-names></name></person-group> (<year>2012</year>). <article-title>Unsupervised feature learning and deep learning: a review and new perspectives</article-title>. <source>CoRR</source> <volume>1</volume>.</mixed-citation></ref>
<ref id="ref6"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Bhutani</surname><given-names>M.</given-names></name> <name><surname>Robinson</surname><given-names>K.</given-names></name> <name><surname>Prabhakaran</surname><given-names>V.</given-names></name> <name><surname>Dave</surname><given-names>S.</given-names></name> <name><surname>Dev</surname><given-names>S.</given-names></name></person-group> (<year>2024</year>). &#x201C;<article-title>SeeGULL multilingual: a dataset of geo-culturally situated stereotypes</article-title>&#x201D; in <source>Proceedings of the 62nd annual meeting of the Association for Computational Linguistics</source>, vol. <volume>2</volume>, <fpage>842</fpage>&#x2013;<lpage>854</lpage>.</mixed-citation></ref>
<ref id="ref7"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Blagec</surname><given-names>K.</given-names></name> <name><surname>Kraiger</surname><given-names>J.</given-names></name> <name><surname>Fr&#x00FC;hwirt</surname><given-names>W.</given-names></name> <name><surname>Samwald</surname><given-names>M.</given-names></name></person-group> (<year>2023</year>). <article-title>Benchmark datasets driving artificial intelligence development fail to capture the needs of medical professionals</article-title>. <source>J. Biomed. Inform.</source> <volume>137</volume>:<fpage>104274</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104274</pub-id>, <pub-id pub-id-type="pmid">36539106</pub-id></mixed-citation></ref>
<ref id="ref8"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Boisson</surname><given-names>J.</given-names></name> <name><surname>Siddique</surname><given-names>Z.</given-names></name> <name><surname>Borkakoty</surname><given-names>H.</given-names></name> <name><surname>Antypas</surname><given-names>D.</given-names></name> <name><surname>Anke</surname><given-names>L. E.</given-names></name> <name><surname>Camacho-Collados</surname><given-names>J.</given-names></name></person-group> (<year>2025</year>). &#x201C;<article-title>Automatic extraction of metaphoric analogies from literary texts: task formulation, dataset construction, and evaluation</article-title>&#x201D; in <source>Proceedings of the 31st international conference on computational linguistics</source>, <fpage>6692</fpage>&#x2013;<lpage>6704</lpage>.</mixed-citation></ref>
<ref id="ref9"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Bolukbasi</surname><given-names>T.</given-names></name> <name><surname>Chang</surname><given-names>K.-W.</given-names></name> <name><surname>Zou</surname><given-names>J. Y.</given-names></name> <name><surname>Saligrama</surname><given-names>V.</given-names></name> <name><surname>Kalai</surname><given-names>A. T.</given-names></name></person-group> (<year>2016</year>). <article-title>Man is to computer programmer as woman is to homemaker? Debiasing word embeddings</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>29</volume>.</mixed-citation></ref>
<ref id="ref10"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Brinkmann</surname><given-names>L.</given-names></name> <name><surname>Baumann</surname><given-names>F.</given-names></name> <name><surname>Bonnefon</surname><given-names>J.-F.</given-names></name> <name><surname>Derex</surname><given-names>M.</given-names></name> <name><surname>M&#x00FC;ller</surname><given-names>T. F.</given-names></name> <name><surname>Nussberger</surname><given-names>A.-M.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Machine culture</article-title>. <source>Nat. Hum. Behav.</source> <volume>7</volume>, <fpage>1855</fpage>&#x2013;<lpage>1868</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41562-023-01742-2</pub-id>, <pub-id pub-id-type="pmid">37985914</pub-id></mixed-citation></ref>
<ref id="ref11"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Burnell</surname><given-names>R.</given-names></name> <name><surname>Schellaert</surname><given-names>W.</given-names></name> <name><surname>Burden</surname><given-names>J.</given-names></name> <name><surname>Ullman</surname><given-names>T. D.</given-names></name> <name><surname>Martinez-Plumed</surname><given-names>F.</given-names></name> <name><surname>Tenenbaum</surname><given-names>J. B.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Rethink reporting of evaluation results in AI</article-title>. <source>Science</source> <volume>380</volume>, <fpage>136</fpage>&#x2013;<lpage>138</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.adf6369</pub-id>, <pub-id pub-id-type="pmid">37053341</pub-id></mixed-citation></ref>
<ref id="ref13"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Caputo</surname><given-names>J. D.</given-names></name></person-group> (<year>2018</year>). <source>Hermeneutics: Facts and interpretation in the age of information</source>. <publisher-loc>London, UK</publisher-loc>: <publisher-name>Penguin UK</publisher-name>.</mixed-citation></ref>
<ref id="ref14"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Caramiaux</surname><given-names>B.</given-names></name> <name><surname>Fdili Alaoui</surname><given-names>S.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x201C;Explorers of unknown planets&#x201D;: practices and politics of artificial intelligence in visual arts</article-title>. <source>Proc. ACM hum.-Comput. Interact</source>. <volume>6</volume>.</mixed-citation></ref>
<ref id="ref15"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Chakrabarty</surname><given-names>T.</given-names></name> <name><surname>Laban</surname><given-names>P.</given-names></name> <name><surname>Agarwal</surname><given-names>D.</given-names></name> <name><surname>Muresan</surname><given-names>S.</given-names></name> <name><surname>Wu</surname><given-names>C.-S.</given-names></name></person-group> (<year>2024</year>). &#x201C;<article-title>Art or artifice? Large language models and the false promise of creativity</article-title>&#x201D; in <source>Proceedings of the 2024 CHI conference on human factors in computing systems, CHI &#x2018;24</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>).</mixed-citation></ref>
<ref id="ref16"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname><given-names>Y.</given-names></name> <name><surname>Wang</surname><given-names>X.</given-names></name> <name><surname>Wang</surname><given-names>J.</given-names></name> <name><surname>Wu</surname><given-names>Y.</given-names></name> <name><surname>Yang</surname><given-names>L.</given-names></name> <name><surname>Zhu</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>A survey on evaluation of large language models</article-title>. <source>ACM Trans. Intell. Syst. Technol.</source> <volume>15</volume>. doi: <pub-id pub-id-type="doi">10.1145/3641289</pub-id></mixed-citation></ref>
<ref id="ref17"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname><given-names>B.</given-names></name> <name><surname>Zhang</surname><given-names>Z.</given-names></name> <name><surname>Langren&#x00E9;</surname><given-names>N.</given-names></name> <name><surname>Zhu</surname><given-names>S.</given-names></name></person-group> (<year>2025</year>). <article-title>Unleashing the potential of prompt engineering for large language models</article-title>. <source>Patterns</source> <volume>6</volume>. doi: <pub-id pub-id-type="doi">10.1016/j.patter.2025.101260</pub-id>, <pub-id pub-id-type="pmid">40575123</pub-id></mixed-citation></ref>
<ref id="ref18"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Chiu</surname><given-names>Y. Y.</given-names></name> <name><surname>Sharma</surname><given-names>A.</given-names></name> <name><surname>Lin</surname><given-names>I. W.</given-names></name> <name><surname>Althoff</surname><given-names>T.</given-names></name></person-group> (<year>2024</year>). <article-title>A computational framework for behavioral assessment of LLM therapists</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref19"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Collins</surname><given-names>K. M.</given-names></name> <name><surname>Sucholutsky</surname><given-names>I.</given-names></name> <name><surname>Bhatt</surname><given-names>U.</given-names></name> <name><surname>Chandra</surname><given-names>K.</given-names></name> <name><surname>Wong</surname><given-names>L.</given-names></name> <name><surname>Lee</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Building machines that learn and think with people</article-title>. <source>Nat. Hum. Behav.</source> <volume>8</volume>, <fpage>1851</fpage>&#x2013;<lpage>1863</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41562-024-01991-9</pub-id>, <pub-id pub-id-type="pmid">39438684</pub-id></mixed-citation></ref>
<ref id="ref20"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Denton</surname><given-names>R.</given-names></name> <name><surname>Hanna</surname><given-names>A.</given-names></name> <name><surname>Amironesei</surname><given-names>R.</given-names></name> <name><surname>Smart</surname><given-names>A.</given-names></name> <name><surname>Nicole</surname><given-names>H.</given-names></name> <name><surname>Scheuerman</surname><given-names>M. K.</given-names></name></person-group> (<year>2020</year>). <article-title>Bringing the people back in: contesting benchmark machine learning datasets</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref21"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Desai</surname><given-names>M. A.</given-names></name> <name><surname>Pasquetto</surname><given-names>I. V.</given-names></name> <name><surname>Jacobs</surname><given-names>A. Z.</given-names></name> <name><surname>Card</surname><given-names>D.</given-names></name></person-group> (<year>2024</year>). <article-title>An archival perspective on pretraining data</article-title>. <source>Patterns</source> <volume>5</volume>. doi: <pub-id pub-id-type="doi">10.1016/j.patter.2024.100966</pub-id>, <pub-id pub-id-type="pmid">38645763</pub-id></mixed-citation></ref>
<ref id="ref22"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>DeVrio</surname><given-names>A.</given-names></name> <name><surname>Cheng</surname><given-names>M.</given-names></name> <name><surname>Egede</surname><given-names>L.</given-names></name> <name><surname>Olteanu</surname><given-names>A.</given-names></name> <name><surname>Blodgett</surname><given-names>S. L.</given-names></name></person-group> (<year>2025</year>). &#x201C;<article-title>A taxonomy of linguistic expressions that contribute to anthropomorphism of language technologies</article-title>&#x201D; in <source>Proceedings of the 2025 CHI conference on human factors in computing systems</source>, <fpage>1</fpage>&#x2013;<lpage>18</lpage>.</mixed-citation></ref>
<ref id="ref23"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Dilthey</surname><given-names>W.</given-names></name></person-group> (<year>1989</year>). <source>Introduction to the human sciences, volume 1</source>. <publisher-loc>Princeton, NJ</publisher-loc>: <publisher-name>Princeton University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref24"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Dobson</surname><given-names>J. E.</given-names></name></person-group> (<year>2019</year>). <source>Critical digital humanities: The search for a methodology</source>. <publisher-loc>Chicago, Illinois</publisher-loc>: <publisher-name>University of Illinois Press</publisher-name>.</mixed-citation></ref>
<ref id="ref25"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Dobson</surname><given-names>J. E.</given-names></name></person-group> (<year>2022</year>). <article-title>Vector hermeneutics: on the interpretation of vector space models of text</article-title>. <source>Digit. Scholarsh. Humanit.</source> <volume>37</volume>, <fpage>81</fpage>&#x2013;<lpage>93</lpage>.</mixed-citation></ref>
<ref id="ref26"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Doshi-Velez</surname><given-names>F.</given-names></name> <name><surname>Kim</surname><given-names>B.</given-names></name></person-group> (<year>2017</year>). <article-title>Towards a rigorous science of interpretable machine learning</article-title>. <source>Stat</source> <volume>1050</volume>:<fpage>2</fpage>.</mixed-citation></ref>
<ref id="ref27"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Earp</surname><given-names>B. D.</given-names></name> <name><surname>PorsdamMann</surname><given-names>S.</given-names></name> <name><surname>Aboy</surname><given-names>M.</given-names></name> <name><surname>Awad</surname><given-names>E.</given-names></name> <name><surname>Betzler</surname><given-names>M.</given-names></name> <name><surname>Botes</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Relational norms for human-AI cooperation</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref29"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Empson</surname><given-names>W.</given-names></name></person-group> (<year>1930</year>). <source>Seven types of ambiguity</source>.</mixed-citation></ref>
<ref id="ref30"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Eriksson</surname><given-names>M.</given-names></name> <name><surname>Purificato</surname><given-names>E.</given-names></name> <name><surname>Noroozian</surname><given-names>A.</given-names></name> <name><surname>Vinagre</surname><given-names>J.</given-names></name> <name><surname>Chaslot</surname><given-names>G.</given-names></name> <name><surname>Gomez</surname><given-names>E.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Can we trust AI benchmarks? An interdisciplinary review of current issues in AI evaluation</article-title>. <source>Proc. AAAI/ACM Conf. AI Ethics Soc.</source> <volume>8</volume>. doi: <pub-id pub-id-type="doi">10.1609/aies.v8i1.36595</pub-id></mixed-citation></ref>
<ref id="ref31"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ethayarajh</surname><given-names>K.</given-names></name></person-group> (<year>2019</year>). &#x201C;<article-title>How contextual are contextualized word representations? Comparing the geometry of BERT, ELMo, and GPT-2 embeddings</article-title>&#x201D; in <source>Proceedings of the 2019 conference on empirical methods in natural language processing and the 9th international joint conference on natural language processing (EMNLP-IJCNLP)</source> (<publisher-loc>Hong Kong, China</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>), <fpage>55</fpage>&#x2013;<lpage>65</lpage>.</mixed-citation></ref>
<ref id="ref32"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ethayarajh</surname><given-names>K.</given-names></name> <name><surname>Jurafsky</surname><given-names>D.</given-names></name></person-group> (<year>2020</year>). &#x201C;<article-title>Utility is in the eye of the user: A critique of NLP leaderboards</article-title>&#x201D; in <source>Proceedings of the 2020 conference on empirical methods in natural language processing (EMNLP)</source> (<publisher-loc>New York City, NY</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>), <fpage>4846</fpage>&#x2013;<lpage>4853</lpage>.</mixed-citation></ref>
<ref id="ref33"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Farrell</surname><given-names>H.</given-names></name> <name><surname>Gopnik</surname><given-names>A.</given-names></name> <name><surname>Shalizi</surname><given-names>C.</given-names></name> <name><surname>Evans</surname><given-names>J.</given-names></name></person-group> (<year>2025</year>). <article-title>Large AI models are cultural and social technologies</article-title>. <source>Science</source> <volume>387</volume>, <fpage>1153</fpage>&#x2013;<lpage>1156</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.adt9819</pub-id>, <pub-id pub-id-type="pmid">40080578</pub-id></mixed-citation></ref>
<ref id="ref34"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Frauenberger</surname><given-names>C.</given-names></name></person-group> (<year>2019</year>). <article-title>Entanglement HCI the next wave?</article-title> <source>ACM Trans. Comput. Hum. Interact.</source> <volume>27</volume>. doi: <pub-id pub-id-type="doi">10.1145/3364998</pub-id></mixed-citation></ref>
<ref id="ref35"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Frenda</surname><given-names>S.</given-names></name> <name><surname>Abercrombie</surname><given-names>G.</given-names></name> <name><surname>Basile</surname><given-names>V.</given-names></name> <name><surname>Pedrani</surname><given-names>A.</given-names></name> <name><surname>Panizzon</surname><given-names>R.</given-names></name> <name><surname>Cignarella</surname><given-names>A. T.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Perspectivist approaches to natural language processing: a survey</article-title>. <source>Lang. Resour. Eval.</source>, <fpage>1</fpage>&#x2013;<lpage>28</lpage>.</mixed-citation></ref>
<ref id="ref28"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Freitas</surname><given-names>J. D.</given-names></name> <name><surname>Censi</surname><given-names>A.</given-names></name> <name><surname>WalkerSmith</surname><given-names>B.</given-names></name> <name><surname>DiLillo</surname><given-names>L.</given-names></name> <name><surname>Anthony</surname><given-names>S. E.</given-names></name> <name><surname>Frazzoli</surname><given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>From driverless dilemmas to more practical commonsense tests for automated vehicles</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>118</volume>:<fpage>e2010202118</fpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2010202118</pub-id>, <pub-id pub-id-type="pmid">33649183</pub-id></mixed-citation></ref>
<ref id="ref36"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Gadamer</surname><given-names>H.-G</given-names></name></person-group>. (<year>1960</year>). <source>Truth and method</source>.</mixed-citation></ref>
<ref id="ref37"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Gaver</surname><given-names>W. W.</given-names></name> <name><surname>Beaver</surname><given-names>J.</given-names></name> <name><surname>Benford</surname><given-names>S.</given-names></name></person-group> (<year>2003</year>). &#x201C;<article-title>Ambiguity as a resource for design</article-title>&#x201D; in <source>Proceedings of the SIGCHI conference on human factors in computing systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>233</fpage>&#x2013;<lpage>240</lpage>.</mixed-citation></ref>
<ref id="ref38"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ge</surname><given-names>X.</given-names></name> <name><surname>Xu</surname><given-names>C.</given-names></name> <name><surname>Misaki</surname><given-names>D.</given-names></name> <name><surname>Markus</surname><given-names>H. R.</given-names></name> <name><surname>Tsai</surname><given-names>J. L.</given-names></name></person-group> (<year>2024</year>). &#x201C;<article-title>How culture shapes what people want from AI</article-title>&#x201D; in <source>Proceedings of the 2024 CHI conference on human factors in computing systems, CHI &#x2018;24</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>).</mixed-citation></ref>
<ref id="ref39"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Geertz</surname><given-names>C.</given-names></name></person-group> (<year>1973</year>). <source>The interpretation of cultures</source>. <publisher-loc>New York City, NY</publisher-loc>: <publisher-name>Basic Books</publisher-name>.</mixed-citation></ref>
<ref id="ref40"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hall</surname><given-names>S.</given-names></name></person-group> (<year>1997</year>). <article-title>Representation: cultural representations and signifying practices</article-title>. <source>Culture</source>.</mixed-citation></ref>
<ref id="ref41"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Haraway</surname><given-names>D.</given-names></name></person-group> (<year>1988</year>). <article-title>Situated knowledges: the science question in feminism and the privilege of partial perspective</article-title>. <source>Feminist Stud.</source> <volume>14</volume>, <fpage>575</fpage>&#x2013;<lpage>599</lpage>.</mixed-citation></ref>
<ref id="ref42"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Heidegger</surname><given-names>M.</given-names></name></person-group> (<year>1927</year>). <source>Being and time</source>.</mixed-citation></ref>
<ref id="ref43"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Hemment</surname><given-names>D.</given-names></name> <name><surname>Kommers</surname><given-names>C.</given-names></name> <etal/></person-group>. (<year>2025</year>). <source>Doing AI differently: Rethinking the foundations of AI via the humanities. Technical report</source>. <publisher-loc>London</publisher-loc>: <publisher-name>The Alan Turing Institute</publisher-name>.</mixed-citation></ref>
<ref id="ref44"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Hemment</surname><given-names>D.</given-names></name> <name><surname>Murray-Rust</surname><given-names>D.</given-names></name> <name><surname>Belle</surname><given-names>V.</given-names></name> <name><surname>Aylett</surname><given-names>R.</given-names></name> <name><surname>Vidmar</surname><given-names>M.</given-names></name> <name><surname>Broz</surname><given-names>F.</given-names></name></person-group> (<year>2024</year>). <article-title>Experiential AI: between arts and explainable AI</article-title>. <source>Leonardo</source> <volume>57</volume>, <fpage>298</fpage>&#x2013;<lpage>306</lpage>.</mixed-citation></ref>
<ref id="ref45"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Heuser</surname><given-names>R.</given-names></name></person-group> (<year>2025</year>). <article-title>Cultural collapse: toward a generative formalism for AI cultural production</article-title>. <source>Anthology Computers Humanities</source> <volume>3</volume>, <fpage>575</fpage>&#x2013;<lpage>588</lpage>. doi: <pub-id pub-id-type="doi">10.63744/usvuyzsiapvy</pub-id></mixed-citation></ref>
<ref id="ref46"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ibrahim</surname><given-names>L.</given-names></name> <name><surname>Akbulut</surname><given-names>C.</given-names></name> <name><surname>Elasmar</surname><given-names>R.</given-names></name> <name><surname>Rastogi</surname><given-names>C.</given-names></name> <name><surname>Kahng</surname><given-names>M.</given-names></name> <name><surname>Morris</surname><given-names>M. R.</given-names></name> <etal/></person-group>. (<year>2025a</year>). <article-title>Multi-turn evaluation of anthropomorphic behaviours in large language models</article-title>. <source>arXiv preprint arXiv:2502.07077.</source></mixed-citation></ref>
<ref id="ref47"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Ibrahim</surname><given-names>L.</given-names></name> <name><surname>Huang</surname><given-names>S.</given-names></name> <name><surname>Ahmad</surname><given-names>L.</given-names></name> <name><surname>Bhatt</surname><given-names>U.</given-names></name> <name><surname>Anderljung</surname><given-names>M.</given-names></name></person-group> (<year>2025b</year>). <article-title>Towards interactive evaluations for interaction harms in human-AI systems</article-title>. In <source>Proceedings of the AAAI/ACM conference on AI, ethics, and society</source> (Vol. <volume>8</volume>. pp. <fpage>1302</fpage>&#x2013;<lpage>1310</lpage>).</mixed-citation></ref>
<ref id="ref48"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>James</surname><given-names>G.</given-names></name> <name><surname>Witten</surname><given-names>D.</given-names></name> <name><surname>Hastie</surname><given-names>T.</given-names></name> <name><surname>Tibshirani</surname><given-names>R.</given-names></name></person-group> (<year>2013</year>). <source>An introduction to statistical learning: With applications in R, volume 103</source>. <publisher-loc>New York City, NY</publisher-loc>: <publisher-name>Springer</publisher-name>.</mixed-citation></ref>
<ref id="ref49"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>John</surname><given-names>Y. J.</given-names></name> <name><surname>Caldwell</surname><given-names>L.</given-names></name> <name><surname>McCoy</surname><given-names>D. E.</given-names></name> <name><surname>Braganza</surname><given-names>O.</given-names></name></person-group> (<year>2024</year>). <article-title>Deadrats, dopamine, performance metrics, and peacock tails: proxy failure is an inherent risk in goal-oriented systems</article-title>. <source>Behav. Brain Sci.</source> <volume>47</volume>:<fpage>e67</fpage>.</mixed-citation></ref>
<ref id="ref50"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kapoor</surname><given-names>S.</given-names></name> <name><surname>Stroebl</surname><given-names>B.</given-names></name> <name><surname>Siegel</surname><given-names>Z. S.</given-names></name> <name><surname>Nadgir</surname><given-names>N.</given-names></name> <name><surname>Narayanan</surname><given-names>A.</given-names></name></person-group> (<year>2024</year>). <article-title>AI agents that matter</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref51"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Klein</surname><given-names>L.</given-names></name> <name><surname>Martin</surname><given-names>M.</given-names></name> <name><surname>Brock</surname><given-names>A.</given-names></name> <name><surname>Antoniak</surname><given-names>M.</given-names></name> <name><surname>Walsh</surname><given-names>M.</given-names></name> <name><surname>Johnson</surname><given-names>J. M.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Provocations from the humanities for generative AI research</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref52"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Koch</surname><given-names>B. J.</given-names></name> <name><surname>Peterson</surname><given-names>D.</given-names></name></person-group> (<year>2024</year>). <article-title>From protoscience to epistemic monoculture: how benchmarking set the stage for the deep learning revolution</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref53"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Kommers</surname><given-names>C.</given-names></name> <name><surname>DeDeo</surname><given-names>S.</given-names></name></person-group> (<year>2025</year>). &#x201C;<article-title>Sense-making, cultural scripts, and the inferential basis of meaningful experience</article-title>&#x201D; in <source>Proceedings of the annual meeting of the cognitive science society</source>, vol. <volume>47</volume>.</mixed-citation></ref>
<ref id="ref54"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kommers</surname><given-names>C.</given-names></name> <name><surname>Duede</surname><given-names>E.</given-names></name> <name><surname>Gordon</surname><given-names>J.</given-names></name> <name><surname>Holtzman</surname><given-names>A.</given-names></name> <name><surname>McNulty</surname><given-names>T.</given-names></name> <name><surname>Stewart</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2025a</year>). <article-title>Why slop matters</article-title>. <source>arXiv preprint arXiv</source>:<fpage>2601.06060</fpage>.</mixed-citation></ref>
<ref id="ref55"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kommers</surname><given-names>C.</given-names></name> <name><surname>Hemment</surname><given-names>D.</given-names></name> <name><surname>Antoniak</surname><given-names>M.</given-names></name> <name><surname>Leibo</surname><given-names>J. Z.</given-names></name></person-group> (<year>2025b</year>). <article-title>Meaning is not a metric: using LLMs to make cultural context legible at scale</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref56"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Kozlowski</surname><given-names>A. C.</given-names></name> <name><surname>Taddy</surname><given-names>M.</given-names></name> <name><surname>Evans</surname><given-names>J. A.</given-names></name></person-group> (<year>2019</year>). <article-title>The geometry of culture: analyzing the meanings of class through word embeddings</article-title>. <source>Am. Sociol. Rev.</source> <volume>84</volume>, <fpage>905</fpage>&#x2013;<lpage>949</lpage>.</mixed-citation></ref>
<ref id="ref57"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Lazar</surname><given-names>S.</given-names></name> <name><surname>Nelson</surname><given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>AI safety on whose terms?</article-title> <source>Science</source> <volume>381</volume>:<fpage>138</fpage>. doi: <pub-id pub-id-type="doi">10.1126/science.adi8982</pub-id>, <pub-id pub-id-type="pmid">37440644</pub-id></mixed-citation></ref>
<ref id="ref58"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Leibo</surname><given-names>J. Z.</given-names></name> <name><surname>Vezhnevets</surname><given-names>A. S.</given-names></name> <name><surname>Diaz</surname><given-names>M.</given-names></name> <name><surname>Agapiou</surname><given-names>J. P.</given-names></name> <name><surname>Cunningham</surname><given-names>W. A.</given-names></name> <name><surname>Sunehag</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>A theory of appropriateness with applications to generative artificial intelligence</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref59"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Levinson</surname><given-names>S.</given-names></name> <name><surname>Mailloux</surname><given-names>S.</given-names></name></person-group> (<year>1988</year>). <source>Interpreting law and literature: A hermeneutic reader</source>. <publisher-loc>Chicago, Illinois</publisher-loc>: <publisher-name>North- western University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref60"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Li</surname><given-names>M.</given-names></name> <name><surname>Chen</surname><given-names>J.</given-names></name> <name><surname>Chen</surname><given-names>L.</given-names></name> <name><surname>Zhou</surname><given-names>T.</given-names></name></person-group> (<year>2024</year>). &#x201C;<article-title>Can LLMs speak for diverse people? Tuning LLMs via debate to generate controllable controversial statements</article-title>&#x201D; in <source>Findings of the Association for Computational Linguistics ACL 2024</source>, <fpage>16160</fpage>&#x2013;<lpage>16176</lpage>.</mixed-citation></ref>
<ref id="ref61"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname><given-names>P.</given-names></name> <name><surname>Bommasani</surname><given-names>R.</given-names></name> <name><surname>Lee</surname><given-names>T.</given-names></name> <name><surname>Tsipras</surname><given-names>D.</given-names></name> <name><surname>Soylu</surname><given-names>D.</given-names></name> <name><surname>Yasunaga</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Holistic evaluation of language models</article-title>. <source>Transactions Machine Learning Research</source>.</mixed-citation></ref>
<ref id="ref62"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Liao</surname><given-names>Q. V.</given-names></name> <name><surname>Xiao</surname><given-names>Z.</given-names></name></person-group> (<year>2023</year>). <article-title>Rethinking model evaluation as narrowing the socio-technical gap</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref63"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Lowe</surname><given-names>R.</given-names></name> <name><surname>Edelman</surname><given-names>J.</given-names></name> <name><surname>Zhi-Xuan</surname><given-names>T.</given-names></name> <name><surname>Klingefjord</surname><given-names>O.</given-names></name> <name><surname>Hain</surname><given-names>E.</given-names></name> <name><surname>Wang</surname><given-names>V.</given-names></name> <etal/></person-group>. (<year>2025</year>). &#x201C;<article-title>Full-stack alignment: co-aligning AI and institutions with thicker models of value</article-title>&#x201D; in <source>2nd workshop on models of human feedback for AI alignment</source>.</mixed-citation></ref>
<ref id="ref64"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Malaviya</surname><given-names>C.</given-names></name> <name><surname>Chang</surname><given-names>J. C.</given-names></name> <name><surname>Roth</surname><given-names>D.</given-names></name> <name><surname>Iyyer</surname><given-names>M.</given-names></name> <name><surname>Yatskar</surname><given-names>M.</given-names></name> <name><surname>Lo</surname><given-names>K.</given-names></name></person-group> (<year>2025</year>). <article-title>Contextualized evaluations: judging language model responses to underspecified queries</article-title>. <source>Trans. Assoc. Comput. Linguist.</source> <volume>13</volume>, <fpage>878</fpage>&#x2013;<lpage>900</lpage>.</mixed-citation></ref>
<ref id="ref65"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Marco</surname><given-names>G.</given-names></name> <name><surname>Gonzalo</surname><given-names>J.</given-names></name> <name><surname>Fresno</surname><given-names>V.</given-names></name></person-group> (<year>2025</year>). <article-title>The reader is the metric: how textual features and reader profiles explain conflicting evaluations of AI creative writing</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref66"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>McIntosh</surname><given-names>T.</given-names></name> <name><surname>Susnjak</surname><given-names>T.</given-names></name> <name><surname>Arachchilage</surname><given-names>N.</given-names></name> <name><surname>Liu</surname><given-names>T.</given-names></name> <name><surname>Xu</surname><given-names>D.</given-names></name> <name><surname>Watters</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Inadequacies of large language model benchmarks in the era of generative artificial intelli- gence</article-title>. <source>IEEE Trans. Artif. Intell.</source></mixed-citation></ref>
<ref id="ref67"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Messeri</surname><given-names>L.</given-names></name> <name><surname>Crockett</surname><given-names>M. J.</given-names></name></person-group> (<year>2024</year>). <article-title>Artificial intelligence and illusions of understanding in scientific research</article-title>. <source>Nature</source> <volume>627</volume>, <fpage>49</fpage>&#x2013;<lpage>58</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41586-024-07146-0</pub-id>, <pub-id pub-id-type="pmid">38448693</pub-id></mixed-citation></ref>
<ref id="ref68"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mihai</surname><given-names>D.</given-names></name> <name><surname>Hare</surname><given-names>J.</given-names></name></person-group> (<year>2021</year>). <article-title>Learning to draw: emergent communication through sketching</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>34</volume>, <fpage>7153</fpage>&#x2013;<lpage>7166</lpage>.</mixed-citation></ref>
<ref id="ref69"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Mihalcea</surname><given-names>R.</given-names></name> <name><surname>Ignat</surname><given-names>O.</given-names></name> <name><surname>Bai</surname><given-names>L.</given-names></name> <name><surname>Borah</surname><given-names>A.</given-names></name> <name><surname>Chiruzzo</surname><given-names>L.</given-names></name> <name><surname>Jin</surname><given-names>Z.</given-names></name> <etal/></person-group>. (<year>2025</year>). <article-title>Why AI is WEIRD and shouldn't be this way: towards AI for everyone, with everyone, by everyone</article-title>. In <source>Proceedings of the AAAI conference on artificial intelligence</source> (Vol. <volume>39</volume>. pp. <fpage>28657</fpage>&#x2013;<lpage>28670</lpage>).</mixed-citation></ref>
<ref id="ref70"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mikolov</surname><given-names>T.</given-names></name> <name><surname>Sutskever</surname><given-names>I.</given-names></name> <name><surname>Chen</surname><given-names>K.</given-names></name> <name><surname>Corrado</surname><given-names>G. S.</given-names></name> <name><surname>Dean</surname><given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Distributed representations of words and phrases and their compositionality</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>26</volume>.</mixed-citation></ref>
<ref id="ref71"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mizrahi</surname><given-names>M.</given-names></name> <name><surname>Kaplan</surname><given-names>G.</given-names></name> <name><surname>Malkin</surname><given-names>D.</given-names></name> <name><surname>Dror</surname><given-names>R.</given-names></name> <name><surname>Shahaf</surname><given-names>D.</given-names></name> <name><surname>Stanovsky</surname><given-names>G.</given-names></name></person-group> (<year>2024</year>). <article-title>State of what art? A call for multi-prompt LLM evaluation</article-title>. <source>Trans. Assoc. Comput. Linguist.</source> <volume>12</volume>, <fpage>933</fpage>&#x2013;<lpage>949</lpage>. doi: <pub-id pub-id-type="doi">10.1162/tacl</pub-id></mixed-citation></ref>
<ref id="ref72"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Mohr</surname><given-names>J. W.</given-names></name> <name><surname>Wagner-Pacifici</surname><given-names>R.</given-names></name> <name><surname>Breiger</surname><given-names>R. L.</given-names></name></person-group> (<year>2015</year>). <article-title>Toward a computational hermeneutics</article-title>. <source>Big Data Soc.</source> <volume>2</volume>:<fpage>2053951715613809</fpage>. doi: <pub-id pub-id-type="doi">10.1177/2053951715613809</pub-id></mixed-citation></ref>
<ref id="ref73"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Murray-Browne</surname><given-names>T.</given-names></name> <name><surname>Tigas</surname><given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>Emergent interfaces: vague, complex, bespoke and embodied interaction between humans and computers</article-title>. <source>Appl. Sci.</source> <volume>11</volume>:<fpage>8531</fpage>. doi: <pub-id pub-id-type="doi">10.3390/app11188531</pub-id></mixed-citation></ref>
<ref id="ref74"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Navigli</surname><given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Word sense disambiguation: a survey</article-title>. <source>ACM Computing Surveys</source> <volume>41</volume>, <fpage>1</fpage>&#x2013;<lpage>69</lpage>.</mixed-citation></ref>
<ref id="ref75"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Nayak</surname><given-names>S.</given-names></name> <name><surname>Bhatia</surname><given-names>M.</given-names></name> <name><surname>Zhang</surname><given-names>X.</given-names></name> <name><surname>Rieser</surname><given-names>V.</given-names></name> <name><surname>Hendricks</surname><given-names>L. A.</given-names></name> <name><surname>Van Steenkiste</surname><given-names>S.</given-names></name> <etal/></person-group>. (<year>2025</year>). &#x201C;<article-title>Culturalframes: assessing cultural expectation alignment in text-to-image models and evaluation metrics</article-title>&#x201D; in <source>Findings of the Association for Computational Linguistics: EMNLP</source>, <fpage>20918</fpage>&#x2013;<lpage>20953</lpage>.</mixed-citation></ref>
<ref id="ref76"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Norah Alzahrani</surname><given-names>N.</given-names></name> <name><surname>Hisham Alyahya</surname><given-names>H.</given-names></name> <name><surname>Yazeed Alnumay</surname><given-names>Y.</given-names></name> <name><surname>Sultan AlRashed</surname><given-names>S.</given-names></name> <name><surname>Shaykhah Alsubaie</surname><given-names>S.</given-names></name> <name><surname>Yousef Al- mushayqih</surname><given-names>Y.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>When benchmarks are targets: revealing the sensitivity of large language model leaderboards</article-title>. In <source>Proceedings of the 62nd annual meeting of the Association for Computational Linguistics</source> (Volume <volume>1</volume>: Long Papers), pages <fpage>13787</fpage>&#x2013;<lpage>13805</lpage>, <publisher-loc>Bangkok, Thailand</publisher-loc>. <publisher-name>Association for Computational Linguistics</publisher-name>.</mixed-citation></ref>
<ref id="ref77"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ott</surname><given-names>S.</given-names></name> <name><surname>Barbosa-Silva</surname><given-names>A.</given-names></name> <name><surname>Blagec</surname><given-names>K.</given-names></name> <name><surname>Brauner</surname><given-names>J.</given-names></name> <name><surname>Samwald</surname><given-names>M.</given-names></name></person-group> (<year>2022</year>). <article-title>Mapping global dynamics of benchmark creation and saturation in artificial intelligence</article-title>. <source>Nat. Commun.</source> <volume>13</volume>:<fpage>6793</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-022-34591-0</pub-id>, <pub-id pub-id-type="pmid">36357391</pub-id></mixed-citation></ref>
<ref id="ref78"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ouyang</surname><given-names>L.</given-names></name> <name><surname>Wu</surname><given-names>J.</given-names></name> <name><surname>Jiang</surname><given-names>X.</given-names></name> <name><surname>Almeida</surname><given-names>D.</given-names></name> <name><surname>Wainwright</surname><given-names>C.</given-names></name> <name><surname>Mishkin</surname><given-names>P.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Training language models to follow instructions with human feedback</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>35</volume>, <fpage>27730</fpage>&#x2013;<lpage>27744</lpage>.</mixed-citation></ref>
<ref id="ref79"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Pennington</surname><given-names>J.</given-names></name> <name><surname>Socher</surname><given-names>R.</given-names></name> <name><surname>Manning</surname><given-names>C.</given-names></name></person-group> (<year>2014</year>). &#x201C;<article-title>GloVe: global vectors for word represen- tation</article-title>&#x201D; in <source>Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP)</source> (<publisher-loc>Doha, Qatar</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>), <fpage>1532</fpage>&#x2013;<lpage>1543</lpage>.</mixed-citation></ref>
<ref id="ref80"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Peter</surname><given-names>S.</given-names></name> <name><surname>Riemer</surname><given-names>K.</given-names></name> <name><surname>West</surname><given-names>J. D.</given-names></name></person-group> (<year>2025</year>). <article-title>The benefits and dangers of anthropomorphic conversational agents</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>122</volume>:<fpage>e2415898122</fpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2415898122</pub-id>, <pub-id pub-id-type="pmid">40378006</pub-id></mixed-citation></ref>
<ref id="ref81"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Placani</surname><given-names>A.</given-names></name></person-group> (<year>2024</year>). <article-title>Anthropomorphism in AI: hype and fallacy</article-title>. <source>AI Ethics</source> <volume>4</volume>, <fpage>691</fpage>&#x2013;<lpage>698</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s43681-024-00419-4</pub-id></mixed-citation></ref>
<ref id="ref82"><mixed-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Raji</surname><given-names>I. D.</given-names></name> <name><surname>Denton</surname><given-names>E.</given-names></name> <name><surname>Bender</surname><given-names>E. M.</given-names></name> <name><surname>Hanna</surname><given-names>A.</given-names></name> <name><surname>Paullada</surname><given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>AI and the everything in the whole wide world benchmark</article-title>. In <conf-name>Thirty-fifth Conference on Neural Information Processing Systems Datasets and Benchmarks Track (Round 2)</conf-name>.</mixed-citation></ref>
<ref id="ref83"><mixed-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Rastogi</surname><given-names>C.</given-names></name> <name><surname>Teh</surname><given-names>T. H.</given-names></name> <name><surname>Mishra</surname><given-names>P.</given-names></name> <name><surname>Patel</surname><given-names>R.</given-names></name> <name><surname>Wang</surname><given-names>D.</given-names></name> <name><surname>Diaz</surname><given-names>M.</given-names></name> <etal/></person-group>. (<year>2026</year>). <article-title>Whose view of safety? A deep DIVE dataset for pluralistic alignment of text-to-image models</article-title>. In <conf-name>The Thirty-ninth Annual Conference on Neural Information Processing Systems Datasets and Benchmarks Track</conf-name>.</mixed-citation></ref>
<ref id="ref84"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Ravichander</surname><given-names>A.</given-names></name> <name><surname>Fisher</surname><given-names>J.</given-names></name> <name><surname>Sorensen</surname><given-names>T.</given-names></name> <name><surname>Lu</surname><given-names>X.</given-names></name> <name><surname>Antoniak</surname><given-names>M.</given-names></name> <name><surname>Lin</surname><given-names>B. Y.</given-names></name> <etal/></person-group>. (<year>2025</year>). &#x201C;<article-title>Information-guided identification of training data imprint in (proprietary) large language models</article-title>&#x201D; in <source>Proceedings of the 2025 conference of the nations of the Americas chapter of the Association for Computational Linguistics: Human language technologies</source>, vol. <volume>1</volume>, <fpage>1962</fpage>&#x2013;<lpage>1978</lpage>.</mixed-citation></ref>
<ref id="ref85"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Rebera</surname><given-names>A. P.</given-names></name> <name><surname>Lauwaert</surname><given-names>L.</given-names></name> <name><surname>Oimann</surname><given-names>A.-K.</given-names></name></person-group> (<year>2025</year>). <article-title>Hidden risks: artificial intelligence and hermeneutic harm</article-title>. <source>Minds Mach.</source> <volume>35</volume>:<fpage>33</fpage>. doi: <pub-id pub-id-type="doi">10.1007/s11023-025-09733-0</pub-id></mixed-citation></ref>
<ref id="ref86"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname><given-names>R.</given-names></name> <name><surname>Basart</surname><given-names>S.</given-names></name> <name><surname>Khoja</surname><given-names>A.</given-names></name> <name><surname>Gatti</surname><given-names>A.</given-names></name> <name><surname>Phan</surname><given-names>L.</given-names></name> <name><surname>Yin</surname><given-names>X.</given-names></name> <etal/></person-group>. (<year>2024</year>). <article-title>Safetywashing: do AI safety benchmarks actually measure safety progress?</article-title> <source>Adv. Neural Inf. Process. Syst.</source> <volume>37</volume>, <fpage>68559</fpage>&#x2013;<lpage>68594</lpage>.</mixed-citation></ref>
<ref id="ref87"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Reuel-Lamparth</surname><given-names>A.</given-names></name> <name><surname>Hardy</surname><given-names>A.</given-names></name> <name><surname>Smith</surname><given-names>C.</given-names></name> <name><surname>Lamparth</surname><given-names>M.</given-names></name> <name><surname>Hardy</surname><given-names>M.</given-names></name> <name><surname>Kochenderfer</surname><given-names>M. J.</given-names></name></person-group> (<year>2024</year>). <article-title>Betterbench: assessing AI benchmarks, uncovering issues, and establishing best practices</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>37</volume>, <fpage>21763</fpage>&#x2013;<lpage>21813</lpage>.</mixed-citation></ref>
<ref id="ref88"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Ricoeur</surname><given-names>P.</given-names></name></person-group> (<year>1981</year>). <source>Hermeneutics and the human sciences: Essays on language, action and interpretation</source>. <publisher-loc>Cambridge, UK</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref89"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Ringler</surname><given-names>H.</given-names></name></person-group> (<year>2024</year>). <article-title>Computation and hermeneutics</article-title>. <source>Computational Humanities</source>:<fpage>1967</fpage>.</mixed-citation></ref>
<ref id="ref90"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Romele</surname><given-names>A.</given-names></name> <name><surname>Severo</surname><given-names>M.</given-names></name> <name><surname>Furia</surname><given-names>P.</given-names></name></person-group> (<year>2020</year>). <article-title>Digital hermeneutics: from interpreting with machines to interpretational machines</article-title>. <source>AI &#x0026; Soc.</source> <volume>35</volume>, <fpage>73</fpage>&#x2013;<lpage>86</lpage>.</mixed-citation></ref>
<ref id="ref91"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Rosen</surname><given-names>S.</given-names></name></person-group> (<year>2003</year>). <source>Hermeneutics as politics</source>. <publisher-loc>New Haven, CT</publisher-loc>: <publisher-name>Yale University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref92"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Schlangen</surname><given-names>D.</given-names></name></person-group> (<year>2021</year>). &#x201C;<article-title>Targeting the benchmark: on methodology in current natural language processing research</article-title>&#x201D; in <source>Proceedings of the 59th annual meeting of the Association for Computational Linguistics and the 11th international joint conference on natural language processing</source>, vol. <volume>2</volume>, <fpage>670</fpage>&#x2013;<lpage>674</lpage>.</mixed-citation></ref>
<ref id="ref93"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Schleiermacher</surname><given-names>F.</given-names></name></person-group> (<year>1998</year>). <source>Schleiermacher: Hermeneutics and criticism: and other writings</source>. <publisher-loc>Cambridge, UK</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref94"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Sharma</surname><given-names>A.</given-names></name> <name><surname>Rushton</surname><given-names>K.</given-names></name> <name><surname>Lin</surname><given-names>I. W.</given-names></name> <name><surname>Nguyen</surname><given-names>T.</given-names></name> <name><surname>Althoff</surname><given-names>T.</given-names></name></person-group> (<year>2024</year>). &#x201C;<article-title>Facilitating self- guided mental health interventions through human-language model interaction: A case study of cognitive restructuring</article-title>&#x201D; in <source>Proceedings of the 2024 CHI conference on human factors in computing systems</source>, <fpage>1</fpage>&#x2013;<lpage>29</lpage>.</mixed-citation></ref>
<ref id="ref95"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Simpson</surname><given-names>L. C.</given-names></name></person-group> (<year>2020</year>). <source>Hermeneutics as critique: Science, politics, race, and culture</source>. <publisher-loc>New York City, NY</publisher-loc>: <publisher-name>Columbia University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref96"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Sorensen</surname><given-names>T.</given-names></name> <name><surname>Moore</surname><given-names>J.</given-names></name> <name><surname>Fisher</surname><given-names>J.</given-names></name> <name><surname>Gordon</surname><given-names>M.</given-names></name> <name><surname>Mireshghallah</surname><given-names>N.</given-names></name> <name><surname>Rytting</surname><given-names>C.- p. M.</given-names></name> <etal/></person-group>. (<year>2024</year>). &#x201C;<article-title>Position: A roadmap to pluralistic alignment</article-title>&#x201D; in <source>Proceedings of the 41st international conference on machine learning</source>, <fpage>46280</fpage>&#x2013;<lpage>46302</lpage>.</mixed-citation></ref>
<ref id="ref97"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Srivastava</surname><given-names>A.</given-names></name> <name><surname>Rastogi</surname><given-names>A.</given-names></name> <name><surname>Rao</surname><given-names>A.</given-names></name> <name><surname>Shoeb</surname><given-names>A. A.</given-names></name> <name><surname>Abid</surname><given-names>A.</given-names></name> <name><surname>Fisch</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Beyond the imitation game: quantifying and extrapolating the capabilities of language models</article-title>. <source>Transactions Machine Learning Research</source>.</mixed-citation></ref>
<ref id="ref98"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Staufer</surname><given-names>L.</given-names></name> <name><surname>Yang</surname><given-names>M.</given-names></name> <name><surname>Reuel</surname><given-names>A.</given-names></name> <name><surname>Casper</surname><given-names>S.</given-names></name></person-group> (<year>2025</year>). <article-title>Audit cards: contextualizing ai evaluations</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref99"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Stoltz</surname><given-names>D. S.</given-names></name> <name><surname>Taylor</surname><given-names>M. A.</given-names></name></person-group> (<year>2021</year>). <article-title>Cultural cartography with word embeddings</article-title>. <source>Poetics</source> <volume>88</volume>:<fpage>101567</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.poetic.2021.101567</pub-id></mixed-citation></ref>
<ref id="ref100"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Szondi</surname><given-names>P.</given-names></name></person-group> (<year>1995</year>). <source>Introduction to literary hermeneutics</source>. <publisher-loc>Cambridge, UK</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>.</mixed-citation></ref>
<ref id="ref101"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Tankelevitch</surname><given-names>L.</given-names></name> <name><surname>Kewenig</surname><given-names>V.</given-names></name> <name><surname>Simkute</surname><given-names>A.</given-names></name> <name><surname>Scott</surname><given-names>A. E.</given-names></name> <name><surname>Sarkar</surname><given-names>A.</given-names></name> <name><surname>Sellen</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2024</year>). &#x201C;<article-title>The metacognitive demands and opportunities of generative AI</article-title>&#x201D; in <source>Proceedings of the 2024 CHI conference on human factors in computing systems</source>, <fpage>1</fpage>&#x2013;<lpage>24</lpage>.</mixed-citation></ref>
<ref id="ref102"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tao</surname><given-names>Y.</given-names></name> <name><surname>Viberg</surname><given-names>O.</given-names></name> <name><surname>Baker</surname><given-names>R. S.</given-names></name> <name><surname>Kizilcec</surname><given-names>R. F.</given-names></name></person-group> (<year>2024</year>). <article-title>Cultural bias and cultural alignment of large language models</article-title>. <source>PNAS Nexus</source> <volume>3</volume>:<fpage>pgae346</fpage>. doi: <pub-id pub-id-type="doi">10.1093/pnasnexus/pgae346</pub-id>, <pub-id pub-id-type="pmid">39290441</pub-id></mixed-citation></ref>
<ref id="ref103"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tomaszewska</surname><given-names>P.</given-names></name> <name><surname>Biecek</surname><given-names>P.</given-names></name></person-group> (<year>2024</year>). <article-title>Position: do not explain vision models without context</article-title>. <source>Proc. Mach. Learn. Res.</source> <volume>235</volume>.</mixed-citation></ref>
<ref id="ref104"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Tseng</surname><given-names>Y. S.</given-names></name></person-group> (<year>2023</year>). <article-title>Assemblage thinking as a methodology for studying urban AI phenomena</article-title>. <source>AI &#x0026; Soc.</source> <volume>38</volume>, <fpage>1099</fpage>&#x2013;<lpage>1110</lpage>.</mixed-citation></ref>
<ref id="ref105"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Turney</surname><given-names>P. D.</given-names></name> <name><surname>Pantel</surname><given-names>P.</given-names></name></person-group> (<year>2010</year>). <article-title>From frequency to meaning: vector space models of semantics</article-title>. <source>J. Artif. Intell. Res.</source> <volume>37</volume>, <fpage>141</fpage>&#x2013;<lpage>188</lpage>. doi: <pub-id pub-id-type="doi">10.1613/jair.2934</pub-id></mixed-citation></ref>
<ref id="ref106"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Underwood</surname><given-names>T.</given-names></name> <name><surname>Nelson</surname><given-names>L. K.</given-names></name> <name><surname>Wilkens</surname><given-names>M.</given-names></name></person-group> (<year>2025</year>). <article-title>Can language models represent the past without anachronism?</article-title> <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref107"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Varimalla</surname><given-names>N. R.</given-names></name> <name><surname>Xu</surname><given-names>Y.</given-names></name> <name><surname>Saakyan</surname><given-names>A.</given-names></name> <name><surname>Wang</surname><given-names>M. F.</given-names></name> <name><surname>Muresan</surname><given-names>S.</given-names></name></person-group> (<year>2025</year>). <article-title>VideoNorms: benchmarking cultural awareness of video language models</article-title>. <source>arXiv preprint arXiv:2510.08543.</source></mixed-citation></ref>
<ref id="ref108"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Vaswani</surname><given-names>A.</given-names></name> <name><surname>Shazeer</surname><given-names>N.</given-names></name> <name><surname>Parmar</surname><given-names>N.</given-names></name> <name><surname>Uszkoreit</surname><given-names>J.</given-names></name> <name><surname>Jones</surname><given-names>L.</given-names></name> <name><surname>Gomez</surname><given-names>A. N.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>Attention is all you need</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>30</volume>.</mixed-citation></ref>
<ref id="ref109"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Veselovsky</surname><given-names>V.</given-names></name> <name><surname>Argin</surname><given-names>B.</given-names></name> <name><surname>Stroebl</surname><given-names>B.</given-names></name> <name><surname>Wendler</surname><given-names>C.</given-names></name> <name><surname>West</surname><given-names>R.</given-names></name> <name><surname>Evans</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2025a</year>). <article-title>Localized cultural knowledge is conserved and controllable in large language models</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref110"><mixed-citation publication-type="confproc"><person-group person-group-type="author"><name><surname>Veselovsky</surname><given-names>V.</given-names></name> <name><surname>Stroebl</surname><given-names>B.</given-names></name> <name><surname>Bencomo</surname><given-names>G.</given-names></name> <name><surname>Arumugam</surname><given-names>D.</given-names></name> <name><surname>Schut</surname><given-names>L.</given-names></name> <name><surname>Narayanan</surname><given-names>A.</given-names></name> <etal/></person-group>. (<year>2025b</year>). <article-title>Hindsight merging: diverse data generation with language models</article-title>. In <conf-name>The 41st Conference on Uncertainty in Artificial Intelligence</conf-name>.</mixed-citation></ref>
<ref id="ref111"><mixed-citation publication-type="other"><person-group person-group-type="author"><name><surname>Weidinger</surname><given-names>L.</given-names></name> <name><surname>Mellor</surname><given-names>J.</given-names></name> <name><surname>Pegueroles</surname><given-names>B.</given-names></name> <name><surname>Marchal</surname><given-names>N.</given-names></name> <name><surname>Kumar</surname><given-names>R.</given-names></name> <name><surname>Lum</surname><given-names>K.</given-names></name> <etal/></person-group>. (<year>2024</year>). &#x201C;<article-title>Star: sociotechnical approach to red teaming language models</article-title>&#x201D; in <source>Proceedings of the 2024 conference on empirical methods in natural language processing</source>, <fpage>21516</fpage>&#x2013;<lpage>21532</lpage>.</mixed-citation></ref>
<ref id="ref112"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Weidinger</surname><given-names>L.</given-names></name> <name><surname>Rauh</surname><given-names>M.</given-names></name> <name><surname>Marchal</surname><given-names>N.</given-names></name> <name><surname>Manzini</surname><given-names>A.</given-names></name> <name><surname>Hendricks</surname><given-names>L. A.</given-names></name> <name><surname>Mateos-Garcia</surname><given-names>J.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Sociotechnical safety evaluation of generative AI systems</article-title>. <source>arXiv preprint arXiv</source>.</mixed-citation></ref>
<ref id="ref113"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yadav</surname><given-names>A.</given-names></name> <name><surname>Patel</surname><given-names>A.</given-names></name> <name><surname>Shah</surname><given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>A comprehensive review on resolving ambiguities in natural language processing</article-title>. <source>AI Open</source> <volume>2</volume>, <fpage>85</fpage>&#x2013;<lpage>92</lpage>.</mixed-citation></ref>
<ref id="ref114"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname><given-names>L.</given-names></name> <name><surname>Zhang</surname><given-names>Z.</given-names></name> <name><surname>Song</surname><given-names>Y.</given-names></name> <name><surname>Hong</surname><given-names>S.</given-names></name> <name><surname>Xu</surname><given-names>R.</given-names></name> <name><surname>Zhao</surname><given-names>Y.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Diffusion models: a comprehensive survey of methods and applications</article-title>. <source>ACM Comput. Surv.</source> <volume>56</volume>, <fpage>1</fpage>&#x2013;<lpage>39</lpage>.</mixed-citation></ref>
<ref id="ref115"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Yong Cao</surname><given-names>Y.</given-names></name> <name><surname>Li Zhou</surname><given-names>L.</given-names></name> <name><surname>Seolhwa Lee</surname><given-names>S.</given-names></name> <name><surname>Laura Cabello</surname><given-names>L.</given-names></name> <name><surname>Min Chen</surname><given-names>M.</given-names></name> <name><surname>Daniel Hershcovich</surname><given-names>D.</given-names></name></person-group> (<year>2023</year>). &#x201C;<article-title>Assessing cross- cultural alignment between ChatGPT and human societies: an empirical study</article-title>&#x201D; in <source>Proceedings of the first workshop on cross-cultural considerations in NLP (C3NLP)</source> (<publisher-loc>Dubrovnik, Croatia</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>), <fpage>53</fpage>&#x2013;<lpage>67</lpage>.</mixed-citation></ref>
<ref id="ref116"><mixed-citation publication-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname><given-names>Y.</given-names></name> <name><surname>Zhang</surname><given-names>R.</given-names></name> <name><surname>Li</surname><given-names>W.</given-names></name> <name><surname>Li</surname><given-names>L.</given-names></name></person-group> (<year>2025</year>). <article-title>Assessing and understanding creativity in large language models</article-title>. <source>Mach. Intell. Res.</source> <volume>22</volume>, <fpage>417</fpage>&#x2013;<lpage>436</lpage>.</mixed-citation></ref>
<ref id="ref117"><mixed-citation publication-type="book"><person-group person-group-type="author"><name><surname>Zhou</surname><given-names>N.</given-names></name> <name><surname>Bamman</surname><given-names>D.</given-names></name> <name><surname>Bleaman</surname><given-names>I. L.</given-names></name></person-group> (<year>2025</year>). &#x201C;<article-title>Culture is not trivia: sociocultural theory for cultural NLP</article-title>&#x201D; in <source>Proceedings of the 63rd annual meeting of the Association for Computational Linguistics</source>, vol. <volume>1</volume> (<publisher-loc>Vienna, Austria</publisher-loc>: <publisher-name>Association for Computational Linguistics</publisher-name>), <fpage>25869</fpage>&#x2013;<lpage>25886</lpage>.</mixed-citation></ref>
</ref-list>
<fn-group>
<fn id="fn0001" fn-type="custom" custom-type="edited-by"><p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2768590/overview">Meital Amzalag</ext-link>, Holon Institute of Technology, Israel</p></fn>
<fn id="fn0002" fn-type="custom" custom-type="reviewed-by"><p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/866774/overview">Gabriel Grill</ext-link>, IT:U Interdisciplinary Transformation University Austria, Austria</p><p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1244688/overview">Josh Andres</ext-link>, University of New South Wales, Australia</p></fn>
</fn-group>
</back>
</article>