<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="review-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Big Data</journal-id>
<journal-title>Frontiers in Big Data</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Big Data</abbrev-journal-title>
<issn pub-type="epub">2624-909X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fdata.2024.1467222</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Big Data</subject>
<subj-group>
<subject>Review</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Establishing and evaluating trustworthy AI: overview and research challenges</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Kowald</surname> <given-names>Dominik</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/975410/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Scher</surname> <given-names>Sebastian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Pammer-Schindler</surname> <given-names>Viktoria</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/830956/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>M&#x000FC;llner</surname> <given-names>Peter</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2200373/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Waxnegger</surname> <given-names>Kerstin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Demelius</surname> <given-names>Lea</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Fessl</surname> <given-names>Angela</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2017613/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Toller</surname> <given-names>Maximilian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mendoza Estrada</surname> <given-names>Inti Gabriel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>&#x00160;imi&#x00107;</surname> <given-names>Ilija</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2871396/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sabol</surname> <given-names>Vedran</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tr&#x000FC;gler</surname> <given-names>Andreas</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Veas</surname> <given-names>Eduardo</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Kern</surname> <given-names>Roman</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Nad</surname> <given-names>Tomislav</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Kopeinik</surname> <given-names>Simone</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/2535159/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Know Center Research GmbH</institution>, <addr-line>Graz</addr-line>, <country>Austria</country></aff>
<aff id="aff2"><sup>2</sup><institution>Institute of Interactive Systems and Data Science, Graz University of Technology</institution>, <addr-line>Graz</addr-line>, <country>Austria</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Geography and Regional Science, Wegener Center for Climate and Global Change, University of Graz</institution>, <addr-line>Graz</addr-line>, <country>Austria</country></aff>
<aff id="aff4"><sup>4</sup><institution>SGS Digital Trusts Services GmbH</institution>, <addr-line>Graz</addr-line>, <country>Austria</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Jose Santamaria Lopez, University of Ja&#x000E9;n, Spain</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Luisa Varriale, University of Naples Parthenope, Italy</p>
<p>Reza Shahbazian, University of Calabria, Italy</p>
<p>Tim Hulsen, Philips, Netherlands</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Dominik Kowald <email>dominik.kowald&#x00040;tugraz.at</email></corresp>
<corresp id="c002">Simone Kopeinik <email>skopeinik&#x00040;know-center.at</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>29</day>
<month>11</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>7</volume>
<elocation-id>1467222</elocation-id>
<history>
<date date-type="received">
<day>19</day>
<month>07</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>11</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2024 Kowald, Scher, Pammer-Schindler, M&#x000FC;llner, Waxnegger, Demelius, Fessl, Toller, Mendoza Estrada, &#x00160;imi&#x00107;, Sabol, Tr&#x000FC;gler, Veas, Kern, Nad and Kopeinik.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Kowald, Scher, Pammer-Schindler, M&#x000FC;llner, Waxnegger, Demelius, Fessl, Toller, Mendoza Estrada, &#x00160;imi&#x00107;, Sabol, Tr&#x000FC;gler, Veas, Kern, Nad and Kopeinik</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Artificial intelligence (AI) technologies (re-)shape modern life, driving innovation in a wide range of sectors. However, some AI systems have yielded unexpected or undesirable outcomes or have been used in questionable manners. As a result, there has been a surge in public and academic discussions about aspects that AI systems must fulfill to be considered trustworthy. In this paper, we synthesize existing conceptualizations of trustworthy AI along six requirements: (1) human agency and oversight, (2) fairness and non-discrimination, (3) transparency and explainability, (4) robustness and accuracy, (5) privacy and security, and (6) accountability. For each one, we provide a definition, describe how it can be established and evaluated, and discuss requirement-specific research challenges. Finally, we conclude this analysis by identifying overarching research challenges across the requirements with respect to (1) interdisciplinary research, (2) conceptual clarity, (3) context-dependency, (4) dynamics in evolving systems, and (5) investigations in real-world contexts. Thus, this paper synthesizes and consolidates a wide-ranging and active discussion currently taking place in various academic sub-communities and public forums. It aims to serve as a reference for a broad audience and as a basis for future research directions.</p></abstract>
<kwd-group>
<kwd>trustworthy AI</kwd>
<kwd>artificial intelligence</kwd>
<kwd>fairness</kwd>
<kwd>human agency</kwd>
<kwd>robustness</kwd>
<kwd>privacy</kwd>
<kwd>accountability</kwd>
<kwd>transparency</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="212"/>
<page-count count="21"/>
<word-count count="19724"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Machine Learning and Artificial Intelligence</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>1 Introduction</title>
<p>From sophisticated chatbots like ChatGPT to AI-driven recommender systems enhancing our entertainment experiences on platforms like Netflix and Spotify (Anderson et al., <xref ref-type="bibr" rid="B13">2020</xref>), the impact of AI on our lives is significant. AI-based decision support systems are proving invaluable in critical fields such as life science and healthcare (Rajpurkar et al., <xref ref-type="bibr" rid="B152">2022</xref>). Similarly, AI is reshaping hiring and human resources practice (Van den Broek et al., <xref ref-type="bibr" rid="B183">2021</xref>) and transforming the banking and finance landscape with innovative solutions (Cao, <xref ref-type="bibr" rid="B47">2022</xref>). However, in the past, some AI systems have been used in questionable manners, which has led to unexpected or undesirable results. Examples include biased algorithms perpetuating discrimination in recruitment processes (Chen, <xref ref-type="bibr" rid="B53">2023</xref>) or AI-driven recommender systems favoring popular content and, with this, users interested in popular content (Kowald et al., <xref ref-type="bibr" rid="B105">2020</xref>; Kowald and Lacic, <xref ref-type="bibr" rid="B104">2022</xref>). Alongside biases in algorithms, AI systems rely on training data, including personal and private user information, which raises concerns about potential privacy and security breaches. One example is the Equifax data breach, in which private data records of millions of users were compromised (Zou and Schaub, <xref ref-type="bibr" rid="B212">2018</xref>). Additionally, when thinking of self-driving cars, unreliable AI-based systems could even cause physical harm, as demonstrated by the unfortunate Uber car crash in 2018, in which a malfunctioning algorithm failed to detect a pedestrian on the road, who was killed as a consequence (Kohli and Chadha, <xref ref-type="bibr" rid="B101">2020</xref>).</p>
<p>As a consequence, there has been an increase in public and academic discussions about the essential requirements AI systems must fulfill to be considered trustworthy. There is also a growing consensus on the necessity of setting up standards and regulations to ensure and validate the trustworthiness of AI. In this respect, the European Commission (EC) has proposed the AI Act (Madiega, <xref ref-type="bibr" rid="B118">2021</xref>), a comprehensive regulatory framework for supporting the responsible development and deployment of AI technologies within the European Union. The AI Act seeks to establish clear rules governing the development and deployment of AI systems while imposing strict requirements for high-risk AI applications. The various interpretations of trustworthy AI add further complexity to this discourse by encompassing not just technical requirements but also human-centered and legal considerations. Another important framework proposed by the European Commission has been the &#x0201C;Assessment List for Trustworthy AI (ALTAI)&#x0201D; (Ala-Pietil&#x000E4; et al., <xref ref-type="bibr" rid="B7">2020</xref>; Radclyffe et al., <xref ref-type="bibr" rid="B151">2023</xref>), which enables organizations to self-assess the trustworthiness of AI solutions based on a checklist.</p>
<p>This paper contributes insights into this discourse by analyzing the state-of-the-art regarding six aspects of AI systems that are typically understood as requirements for systems to be viewed as trustworthy. These requirements are: (1) human agency and oversight, (2) fairness and non-discrimination, (3) transparency and explainability, (4) robustness and accuracy, (5) privacy and security, and (6) accountability (see <xref ref-type="fig" rid="F1">Figure 1</xref>). We define each of these six requirements, introduce methods to establish and implement these requirements in AI systems, and discuss corresponding validation methods and evaluation metrics. Such validation efforts are crucial from scientific and practical perspectives and might serve as a prerequisite for certifying AI systems and models (Winter et al., <xref ref-type="bibr" rid="B197">2021</xref>). Finally, for each of these requirements, we outline ongoing research challenges and future research perspectives.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>An illustration of the six requirements of trustworthy AI investigated in this paper.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fdata-07-1467222-g0001.tif"/>
</fig>
<p>The contributions of our work are two-fold: firstly, we give a comprehensive overview of the requirements of trustworthy AI, in which we cover different viewpoints on trustworthy AI, including technical and also human-centered and legal considerations. Secondly, we discuss open issues and challenges in defining, establishing, and evaluating these requirements of trustworthy AI. Therefore, the guiding research question of this work is defined as follows: <italic>What is the current state of research regarding the establishment and evaluation of comprehensive - technical, human-centered, and legal - requirements of trustworthy AI?</italic> To address this research question, we follow the methodology described in Section 2.3.</p>
<p>Our work complements existing surveys and articles on trustworthy AI in two main ways. Firstly, existing overview articles such as Chatila et al. (<xref ref-type="bibr" rid="B52">2021</xref>); Thiebes et al. (<xref ref-type="bibr" rid="B181">2021</xref>); Akbar et al. (<xref ref-type="bibr" rid="B5">2024</xref>); D&#x000ED;az-Rodr&#x000ED;guez et al. (<xref ref-type="bibr" rid="B57">2023</xref>) tend to focus on definitions of trustworthy AI and neglect evaluation aspects, which is one key aspect of our article. Specifically, related surveys such as Liang et al. (<xref ref-type="bibr" rid="B113">2022</xref>); Wing (<xref ref-type="bibr" rid="B196">2021</xref>); Emaminejad and Akhavian (<xref ref-type="bibr" rid="B65">2022</xref>) focus on specific aspects of trustworthy AI implementation and evaluation, namely data, formal methods, and robotics, respectively. In contrast, our article aims to provide a domain- and method-independent overview of trustworthy AI, which reflects the whole AI-lifecycle, including the evaluation phase. Secondly, concerning validation and evaluation schemes for trustworthy AI, existing technical conceptualizations of trustworthy AI such as Floridi (<xref ref-type="bibr" rid="B73">2021</xref>); Kaur et al. (<xref ref-type="bibr" rid="B98">2022</xref>); Li et al. (<xref ref-type="bibr" rid="B111">2023</xref>) have focused on technical and reliability-oriented requirements such as transparency, privacy, and robustness. In contrast, in our paper, we discuss methods and open challenges toward establishing and evaluating trustworthy AI also through the lens of human-centric and legal requirements such as fairness, accountability, and human agency. 
Therefore, to the best of our knowledge, our paper is the first to investigate all six requirements of trustworthy AI in a unified way by discussing implementation and evaluation aspects across the whole lifecycle of trustworthy AI and outlining open research challenges and issues for all six requirements.</p>
<p>Our article shows that while evaluation and validation methodologies for technical requirements like robustness may rely on established metrics and testing procedures (e.g., for model accuracy), the assessment of human-centric considerations often requires more nuanced approaches that consider ethical, legal, and cultural factors. As such, our article emphasizes the need for further research to develop robust evaluation schemes that can be applied in research and practice across a variety of AI systems, particularly in high-risk domains where human values and rights are at stake (e.g., healthcare).</p>
<p>Next, in Section 2, we describe the relevant background for this article, including general definitions of AI and its lifecycle, and introduce the six requirements of trustworthy AI covered herein. After discussing each requirement separately in Section 3, the paper closes with a conclusion and an outlook into future research directions in Section 4.</p></sec>
<sec id="s2">
<title>2 Background</title>
<p>In this section, we give a short overview of definitions and preliminaries relevant to our article, introduce the six requirements of trustworthy AI discussed, and describe the methodology of our investigation.</p>
<sec>
<title>2.1 Definitions and preliminaries of trustworthy AI</title>
<p>For our understanding of AI in the context of this work, we adhere to the definition outlined in the EU AI Act (adopted text, Art 3(1),<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref>), in which AI is defined as &#x0201C;<italic>a machine-based system designed to operate with varying levels of autonomy and that may exhibit adaptiveness after deployment and that, for explicit or implicit objectives, infers, from the input it receives, how to generate outputs such as predictions, content, recommendations, or decisions that can influence physical or virtual environments</italic>.&#x0201D; This definition encompasses a broad spectrum of algorithmic implementations, from simple logistic regression models to complex machine-learning approaches. In the article at hand, we consider this spectrum of AI systems, recognizing the diverse challenges and requirements that are associated with ensuring its trustworthiness.</p>
<p>Additionally, we aim to consider the trustworthiness of AI from a holistic perspective that can be influenced in all phases of the AI-lifecycle, as thoroughly described in Haakman et al. (<xref ref-type="bibr" rid="B83">2021</xref>) (see <xref ref-type="fig" rid="F2">Figure 2</xref>). These phases encompass the design, development, and deployment of AI-based systems and their designated tasks. While discussing the requirements of trustworthy AI, we refer to the phases where needed in this article. To comply with trustworthy AI, special attention should be paid to considering AI requirements in the <italic>design phase</italic> throughout requirements engineering, problem understanding, and data collection strategies, the <italic>development phase</italic>, comprising model implementation (e.g., optimizing feature weights), documentation, and evaluation, and finally, the <italic>deployment phase</italic> including the integration of the AI model into a production environment, and the continuous monitoring and updating of the model.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>The AI-lifecycle. The trustworthiness of AI can be influenced in all phases&#x02014;the design phase, the development phase, and the deployment phase.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fdata-07-1467222-g0002.tif"/>
</fig></sec>
<sec>
<title>2.2 Requirements of trustworthy AI</title>
<p>Over the last years, various frameworks, guidelines, survey articles, and collections of requirements of trustworthy AI have been developed and published by researchers, governments, and private organizations (Smuha, <xref ref-type="bibr" rid="B173">2019</xref>; Kaur et al., <xref ref-type="bibr" rid="B97">2021</xref>; Floridi, <xref ref-type="bibr" rid="B73">2021</xref>; Kaur et al., <xref ref-type="bibr" rid="B98">2022</xref>; Li et al., <xref ref-type="bibr" rid="B111">2023</xref>; Yeung, <xref ref-type="bibr" rid="B201">2020</xref>). Although these investigations differ with respect to the exact wordings, they agree on four fundamental principles that need to be considered when developing and validating trustworthy AI: (1) respect for human autonomy, (2) fairness, (3) explicability, and (4) prevention of harm (Smuha, <xref ref-type="bibr" rid="B173">2019</xref>; Kaur et al., <xref ref-type="bibr" rid="B97">2021</xref>, <xref ref-type="bibr" rid="B98">2022</xref>). In the following, we describe six requirements of trustworthy AI that are manifested within these principles.</p>
<p>Hereinafter, principle 1 (respect for human autonomy) is mainly associated with <bold>human agency and oversight</bold> (requirement 1, see Section 3.1), which refers to sustaining the autonomy of humans affected by AI systems, given different levels of human-AI interaction. The second principle (fairness) aims for the equal treatment of all affected individuals and subpopulations (e.g., defined by age, gender, or education). <bold>Fairness and non-discrimination</bold> (requirement 2, see Section 3.2) describes the absence of bias in AI decisions that could result in unfair, unequal treatment that negatively affects certain people. Next, principle 3 (explicability) ensures the AI system is transparent and explainable. In particular, <bold>transparency and explainability</bold> (requirement 3, see Section 3.3) is defined as the understandability of an AI system and the provision of information to explain the AI model&#x00027;s decisions.</p>
<p>Finally, principle 4 (prevention of harm) should ensure that the AI system does not cause any harm to humans, society, or the environment. For example, it should be prevented that AI-based systems harm or, even worse, kill humans, which unfortunately has happened, e.g., in the aforementioned Uber car crash in 2018, in which a pedestrian was killed by a malfunctioning self-driving car (Kohli and Chadha, <xref ref-type="bibr" rid="B101">2020</xref>). This principle includes a range of requirements, including technical and legal concerns. An essential technical requirement within this principle is <bold>robustness and accuracy</bold> (requirement 4, see Section 3.4), which is related to the performance of AI models and their ability to function in unexpected circumstances. Additionally, the principle &#x0201C;prevention of harm&#x0201D; is linked to <bold>privacy and security</bold> (requirement 5, see Section 3.5) that focuses on protecting the personal and sensitive information of users in AI systems and on preventing malicious attacks on AI models. Concerning legal aspects, <bold>accountability</bold> (requirement 6, see Section 3.6) entails understanding who is responsible for the decisions of AI systems and ensuring that mechanisms are in place to intervene in the case of negative consequences. The literature (e.g., Kaur et al., <xref ref-type="bibr" rid="B97">2021</xref>; Smuha, <xref ref-type="bibr" rid="B173">2019</xref>) also discusses other important requirements of trustworthy AI within this principle, such as safety, reproducibility, sustainability, societal and environmental wellbeing, and data governance. While we highlight these requirements&#x00027; significance, we believe they serve as overarching aspects that underpin the six requirements of trustworthy AI discussed in this article. 
However, we strongly suggest a foundational commitment to safety, reproducibility, sustainability, societal and environmental wellbeing, and data governance when developing and validating trustworthy AI. In the next section, we discuss in detail these six requirements outlined above.</p></sec>
<sec>
<title>2.3 Methodology</title>
<p>To collect relevant resources, we conduct an exploratory approach to define the research field and, for the main part, follow a semi-structured literature review (Snyder, <xref ref-type="bibr" rid="B174">2019</xref>). This allows the consideration of interdisciplinary literature to (1) specify a comprehensive set of aspects of trustworthiness in AI, (2) synthesize available knowledge regarding these aspects that is relevant when aiming to design, implement, and evaluate trustworthy AI, and (3) identify open challenges and knowledge gaps in these regards. Thus, we conducted exploratory literature research on trustworthy AI in general, which resulted in the six herein-discussed requirements. Then, the following procedure was completed for each requirement: (1) a Scopus search for conference papers, articles, and reviews, (2) the screening of the 100 most relevant abstracts as ranked by Scopus, (3) the screening of the remaining papers, and the extraction of relevant content, (4) snowballing and additional search in Google Scholar to close information gaps.</p>
<p>The goal of this paper was not to cover all existing publications of the field but rather to generate a comprehensive understanding of relevant research directions and their existing challenges. Therefore, we excluded articles with over-specialization, such as solutions only applicable to specific use cases or domains, and articles with limited contributions. This resulted in a collection of 183 papers as illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>The number of publications per requirement included in this paper across publication years. We investigate 183 publications: 20 publications for <italic>human agency and oversight</italic>, 35 publications for <italic>fairness and non-discrimination</italic>, 47 publications for <italic>transparency and explainability</italic>, 21 publications for <italic>robustness and accuracy</italic>, 37 publications for <italic>privacy and security</italic>, and 23 publications for <italic>accountability</italic>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fdata-07-1467222-g0003.tif"/>
</fig>
</sec>
</sec>
<sec id="s3">
<title>3 Overview and discussion of trustworthy AI requirements</title>
<p>In the following, we discuss six requirements an AI-based system should meet to be considered trustworthy. Each requirement is first defined, then we describe methods to establish and evaluate it, and finally, we debate open issues and research challenges. <xref ref-type="table" rid="T1">Table 1</xref> provides a complementary illustration of the problem definitions of these six requirements.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Problem definitions of the six trustworthy AI requirements investigated in this paper.</p></caption>
<table frame="box" rules="all">
<thead>
<tr style="background-color:#919498;color:#ffffff">
<th valign="top" align="left"><bold>Trustworthy AI requirement</bold></th>
<th valign="top" align="left"><bold>Problem definition</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Human agency and oversight</td>
<td valign="top" align="left">Sustaining the autonomy of humans affected by AI systems</td>
</tr> <tr>
<td valign="top" align="left">Fairness and non-discrimination</td>
<td valign="top" align="left">Mitigating bias in AI decisions to prevent unfair treatment</td>
</tr> <tr>
<td valign="top" align="left">Transparency and explainability</td>
<td valign="top" align="left">Improving the understandability of an AI system and its decisions</td>
</tr> <tr>
<td valign="top" align="left">Robustness and accuracy</td>
<td valign="top" align="left">Sustaining the model&#x00027;s performance (in unexpected circumstances)</td>
</tr> <tr>
<td valign="top" align="left">Privacy and security</td>
<td valign="top" align="left">Protecting personal information of users in AI systems</td>
</tr> <tr>
<td valign="top" align="left">Accountability</td>
<td valign="top" align="left">Understanding who is responsible for the decisions of AI systems</td>
</tr></tbody>
</table>
</table-wrap>
<sec>
<title>3.1 Requirement 1: human agency and oversight</title>
<sec>
<title>3.1.1 Definition of human agency and oversight</title>
<p>The principle of human agency and oversight refers to the idea that AI systems should uphold individual autonomy and dignity, and need to operate in a way that allows for substantial human control over the AI system&#x00027;s impact on people and society. This principle further postulates that AI systems should contribute to a democratic, flourishing, and equitable society and allow for human supervision to foster fundamental rights and ethical norms (High-Level Expert Group on AI, <xref ref-type="bibr" rid="B90">2019</xref>).</p>
<p>Although the terms <italic>human agency</italic> and <italic>human oversight</italic> are very similar and sometimes used synonymously, they are not interchangeable (Bennett et al., <xref ref-type="bibr" rid="B28">2023</xref>). In this paper, we understand the term and concept <italic>human agency</italic> as referring to the very broad idea that humans as intentional actors should be in control, particularly with respect to substantial and important parts of their lives (High-Level Expert Group on AI, <xref ref-type="bibr" rid="B90">2019</xref>). AI systems shall not restrict this agency; rather, it would be desirable that through AI systems, human agency is increased. AI systems could, for instance, limit human agency by deceiving or manipulating users. However, users should be able to influence automated decisions and to fairly evaluate or question the AI system. Consequently, users who are impacted by AI systems or who oversee AI systems need to be able to acquire or to be equipped with related competencies and skills (AI Literacy) to understand and engage with AI systems to a satisfying degree (Long and Magerko, <xref ref-type="bibr" rid="B116">2020</xref>; Pammer-Schindler and Lindstaedt, <xref ref-type="bibr" rid="B144">2022</xref>).</p>
<p>The term and concept of <italic>human oversight</italic> is more specifically related to how AI systems are used and suggests that AI systems do not operate entirely autonomously, but instead, humans should oversee the way AI systems &#x0201C;work&#x0201D; within a more extensive process. This concept, therefore, is concerned with forms of human-AI interaction or collaboration, postulating that humans should be in a supervisory and decision-making role. Human oversight activities include observing, interpreting, and interfering in AI operations. Human oversight can be understood as a specific approach to facilitating human agency.</p>
<p>Long and Magerko (<xref ref-type="bibr" rid="B116">2020</xref>) define AI literacy as <italic>&#x0201C;a set of competencies that enables individuals to evaluate AI technologies critically; communicate and collaborate effectively with AI; and use AI as a tool online, at home, and in the workplace.&#x0201D;</italic> Being AI literate means having a basic understanding of AI that empowers users to better interact with AI systems as they are able to judge the outcomes provided and, at the same time, to retain autonomy and agency (Hermann, <xref ref-type="bibr" rid="B89">2022</xref>). Facilitating AI literacy on a large scale is currently a subject both of research (Ng et al., <xref ref-type="bibr" rid="B138">2021</xref>) and of public endeavor.</p></sec>
<sec>
<title>3.1.2 Methods to establish human agency and oversight</title>
<p>Very broadly speaking, socio-technical and human-centric design methods (Baxter and Sommerville, <xref ref-type="bibr" rid="B26">2010</xref>) are approaches for designing (AI-based) systems that can systematically consider human users and people impacted, from the very early stage of designing the systems (Dennerlein et al., <xref ref-type="bibr" rid="B56">2020</xref>). The consideration of human factors in the design phase of the AI-lifecycle (see <xref ref-type="fig" rid="F2">Figure 2</xref>) responds well to the complex dynamics of the issues. Humans can interact with AI in various ways, which may require different levels of human agency and oversight. Anders et al. (<xref ref-type="bibr" rid="B12">2022</xref>) propose to think of different patterns of human engagement with AI-based operations and decisions as follows, sorted along the decreasing involvement of humans:</p>
<list list-type="bullet">
<list-item><p><italic>Human-in-command</italic>: Humans manage and oversee an AI system&#x00027;s overall operation, including its wider impact on society, economy, law, and ethics. Decisions at a high level are made on when and how to use an AI system (Anderson and Fort, <xref ref-type="bibr" rid="B14">2022</xref>). For example, regulatory bodies set ethical guidelines for the deployment of AI systems in healthcare to ensure patient safety and data privacy.</p></list-item>
<list-item><p><italic>Human-in-the-loop</italic>: Humans can intervene in AI-based decisions as well as in different steps of the underlying (typically machine learning based) algorithms (Mosqueira-Rey et al., <xref ref-type="bibr" rid="B128">2023</xref>; Munro, <xref ref-type="bibr" rid="B133">2021</xref>). In medical diagnostics, for example, an AI system can suggest potential diagnoses, but a physician reviews and decides on the diagnosis and treatment plan. Note that often, this kind of human-computer collaboration is not possible or even desired (High-Level Expert Group on AI, <xref ref-type="bibr" rid="B90">2019</xref>).</p></list-item>
<list-item><p><italic>Human-on-the-loop</italic>: Humans can intervene through (re-)designing the AI system or through involvement in system operations, where their role is primarily focused on monitoring (Anderson and Fort, <xref ref-type="bibr" rid="B14">2022</xref>). For example, a human operator may remotely monitor the performance of an autonomous vehicle and intervene only in emergency situations.</p></list-item>
<list-item><p><italic>Human-out-of-the-loop</italic>: Humans do not intervene. This could mean allowing an AI-based system to work without human involvement for specific tasks or in a completely automated manner. For example, in fully automated sections of vehicle production assembly lines, car parts can be assembled without human interaction.</p></list-item>
</list>
<p>Other authors categorize the spectrum of involvement in the design and operations of AI-based systems differently. For instance, Fanni et al. (<xref ref-type="bibr" rid="B70">2020</xref>) suggest a distinction between active and passive agency. Passive agency occurs when there are limited or no communication features that provide explanations for the decisions made by the AI system, or when users are uninformed about the potential consequences of AI interventions. This passive agency relates to the concepts of human-out-of-the-loop and human-on-the-loop. In contrast, active agency refers to situations where humans play a critical role in the design and operations of the AI-based system. This relates to human-in-the-loop and human-in-command approaches. Wang B. Y. et al. (<xref ref-type="bibr" rid="B188">2023</xref>) propose the level of involvement to be defined by decisions and actions undertaken by humans and by AI-based systems. The authors provide an example pattern of human-AI interaction as &#x0201C;AI Suggests, Human Intelligence (HI) Decides&#x0201D;, which can be interpreted such that the AI is providing recommendations, but humans are taking the role of final decision makers. Overall, thinking about such patterns of human-AI interaction allows deciding&#x02014;at the time of designing and using an AI-based system&#x02014;what kind of interaction is desirable or possible. Finally, we introduce the notion of AI literacy as positively contributing to human agency and oversight. This applies to both the users of AI-based systems and the decision-makers responsible for regulating and deciding which systems are used and how or what AI-related competencies users need to deal with AI systems.</p>
<p>AI literacy can be obtained in two dominant ways. First, through education in AI, particularly about everyday activities and technology (Zimmerman, <xref ref-type="bibr" rid="B210">2018</xref>). Such education can also be mediated by technology. For instance, researchers are engaging young learners in creative programming activities, including AI (Kahn and Winters, <xref ref-type="bibr" rid="B96">2017</xref>; Zimmermann-Niefield et al., <xref ref-type="bibr" rid="B211">2019</xref>). Secondly, everyday AI systems could be designed to support users in being or becoming AI literate. Long and Magerko (<xref ref-type="bibr" rid="B116">2020</xref>) outlined 15 concrete design considerations to promote users&#x00027; understanding and learning when interacting with AI systems. For example, AI systems could provide visualizations and explanations of decision-making processes to enhance users&#x00027; comprehension. They could also offer users the opportunity to learn about the system&#x00027;s reasoning processes by putting themselves &#x0201C;in the agent&#x00027;s shoes&#x0201D;; to encourage users to investigate the used data in terms of source, data collection processes, and known limitations or encourage users &#x0201C;<italic>to be critical consumers of AI technologies by questioning their intelligence and trustworthiness</italic>&#x0201D;. Such support of AI literacy by AI systems is precious, as complex knowledge is highly context- and activity-dependent, and transferring knowledge from one context or activity to another can be quite challenging (Eraut, <xref ref-type="bibr" rid="B66">2004</xref>).</p>
<p>Overall, systems need to be designed to be understandable for humans (Long and Magerko, <xref ref-type="bibr" rid="B116">2020</xref>; Ng et al., <xref ref-type="bibr" rid="B138">2021</xref>). This relates to the long-standing concepts of usability and learnability of systems. Finally, some of the above-described concepts, such as explaining decision-making, are essential for supporting transparency and explainability (see Section 3.3).</p></sec>
<sec>
<title>3.1.3 Methods to evaluate human agency and oversight</title>
<p>Building upon the previous discussion of human agency, human oversight, and AI literacy and their interrelations, we propose considering evaluation as moving up the hierarchy of dependencies:</p>
<list list-type="bullet">
<list-item><p><italic>AI literacy:</italic> AI literacy of relevant stakeholders is considered a prerequisite for human agency and oversight. This level can be assessed, for instance, through knowledge or competency tests, by checking certifications and formal degrees, or by investigating educational opportunities that relevant stakeholders have accessed or utilized.</p></list-item>
<list-item><p><italic>System understandability:</italic> It is critical to evaluate whether the AI-based system or functionality communicates understandably how it operates and what effects user actions might have. This relates to established concepts of usability and learnability and newer, AI-specific concepts like transparency and explainability (see Section 3.3).</p></list-item>
<list-item><p><italic>Human oversight:</italic> It needs to be established whether and how the intended interaction pattern of human oversight is present in the evaluation setting. This evaluation level concerns observing the designed activity, with a focus on establishing whether humans are, reasonably and in an engaged manner, involved in the process, either in-the-loop, on-the-loop, or in-command.</p></list-item>
<list-item><p><italic>Human agency:</italic> This is probably the most challenging concept to verify. One could argue that the existence and evaluation of a human-centric and socio-technical (AI) design process implies a certain level of human agency. The discussions led during this process could provide insights into how human agency is conceptualized and implemented in the AI-based system. In the inverse, it may be possible to establish its absence, i.e., when it becomes noticeable that human agency is limited through an AI-based system or functionality.</p></list-item>
</list></sec>
<sec>
<title>3.1.4 Open issues and research challenges</title>
<p>Challenges concern the <italic>conceptualization of human agency, oversight, and AI literacy</italic> as interwoven concepts, and the operationalization in design patterns of (interfaces for) AI. Such developments will need to be made in relation to maturing technology such as increasing shop-floor automation at the conjunction of Internet of Things and AI-enabled data analytics, or the usage of generative AI across many sectors of knowledge-based and creative work. Additionally, more and better synthesized <italic>design-oriented knowledge that captures how to design for human agency, oversight, and AI literacy</italic> is pending. To date, research is revisiting the value of these design principles, e.g., in the context of AI (Long and Magerko, <xref ref-type="bibr" rid="B116">2020</xref>) or generative AI (Simkute et al., <xref ref-type="bibr" rid="B170">2024</xref>; Weisz et al., <xref ref-type="bibr" rid="B193">2024</xref>). However, these design principles need clearer examples of how to operationalize them concretely within applications. Finally, due to the unclear conceptualization and the plethora of different designs with little grouping into overarching design patterns, <italic>the evaluation of human agency, oversight, and AI literacy</italic> will remain challenging. Evaluations will also need to uncover how these concepts interact with design patterns, ethics, and trust in AI systems (High-Level Expert Group on AI, <xref ref-type="bibr" rid="B90">2019</xref>), actual decisions made in the domain of interest, and the overall socio-technical system performance (i.e., how good are decisions in the broader context and for whom).</p></sec></sec>
<sec>
<title>3.2 Requirement 2: fairness and non-discrimination</title>
<sec>
<title>3.2.1 Definition of fairness and non-discrimination</title>
<p>As AI products are being increasingly used in various fields and domains, their influence and impact on society are discussed not only in the machine learning community (e.g., Righetti et al., <xref ref-type="bibr" rid="B156">2019</xref>) but also among the general public. AI may negatively impact individuals and society by reproducing existing societal stereotypes that can adversely affect vulnerable groups (Dubal, <xref ref-type="bibr" rid="B59">2023</xref>). The unjust treatment of specific populations or individuals is particularly concerning in sensitive fields such as criminal justice, employment, education, or health, as it can result in significant consequences such as being refused medical care (Seyyed-Kalantari et al., <xref ref-type="bibr" rid="B166">2021</xref>) or educational opportunity (Chang et al., <xref ref-type="bibr" rid="B51">2021</xref>). Previous instances of such misconduct have been documented, including Google Ads showing lower-paid jobs to women and minority groups,<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref> Apple Card granting lower credit limits to women than equally qualified men,<xref ref-type="fn" rid="fn0003"><sup>3</sup></xref> and commercial facial recognition systems performing poorly for women with black skin (Buolamwini and Gebru, <xref ref-type="bibr" rid="B43">2018</xref>).</p>
<p>People&#x00027;s perception of fairness strongly depends on the context, which can include various factors, such as socio-political views, personal preferences, or the particular context and use case (Saxena, <xref ref-type="bibr" rid="B162">2019</xref>). Especially in AI systems, achieving fairness is a multifaceted problem. Algorithmic fairness describes the absence of bias in AI decisions that would favor or disadvantage a person or group in a way that is considered unfair in the context of the application (Ntoutsi et al., <xref ref-type="bibr" rid="B142">2020</xref>; Srivastava et al., <xref ref-type="bibr" rid="B175">2019</xref>). Bias, often also called &#x0201C;discriminatory&#x0201D; or &#x0201C;unfair&#x0201D; bias, refers to outcomes of disproportionate advantage or disadvantage for a specific group of individuals, i.e., &#x0201C;<italic>systematic discrimination combined with an unfair outcome is considered bias</italic>&#x0201D; (Bird et al., <xref ref-type="bibr" rid="B33">2019</xref>). Consequently, we refer to fairness as the absence of discriminatory or &#x0201C;unfair&#x0201D; bias toward individuals, items, or groups.</p>
<p>Although ethical concerns are often at the forefront of public discourse, &#x0201C;unfair&#x0201D; bias can significantly impact society and businesses, even in seemingly non-critical domains. Therefore, it is crucial to consider the various risks from a business perspective. According to a report by Fancher et al. (<xref ref-type="bibr" rid="B69">2021</xref>), biased AI bears risk for several negative consequences. These include missing out on potential business opportunities, damaging reputation, and facing regulatory and compliance issues. One example of missing out on opportunities is when a recommender system only benefits a particular user group (Kowald and Lacic, <xref ref-type="bibr" rid="B104">2022</xref>). While the members of the advantaged group may find the system useful, other groups don&#x00027;t experience the same level of system performance and stop using the product. This results in a loss of potential customers for the platform provider. Another consequence of biased AI is reputational damage, especially when the technology fails to address sensitive societal issues. For instance, using face recognition software that only works well for parts of the ethnicities in the user population will likely lead to negative public perception and backlash against the company. Finally, in cases where anti-discrimination laws govern the use of AI, such as in the job market, unfair algorithms can lead to legal problems. For example, an HR system that discriminates based on gender, age, or race can result in fines and penalties for the company. More information on accountability can be found in Section 3.6.</p>
<p>Furthermore, the issue of bias and fairness is complex because bias is naturally inherent in human behavior (Houwer, <xref ref-type="bibr" rid="B92">2019</xref>) and thus, &#x0201C;unfair&#x0201D; bias can be introduced in every stage of the AI-lifecycle, as illustrated in Section 2. This problem becomes even more challenging in evolving AI systems because they can potentially reinforce bias between the user population, data, and algorithm (Baeza-Yates, <xref ref-type="bibr" rid="B20">2018</xref>). Thus, monitoring and addressing &#x0201C;unfair&#x0201D; bias throughout the entire AI-lifecycle is essential.</p></sec>
<sec>
<title>3.2.2 Methods to establish fairness and non-discrimination</title>
<p>A wide range of methods has been proposed to increase fairness in AI models (Bellamy et al., <xref ref-type="bibr" rid="B27">2019</xref>; Barocas et al., <xref ref-type="bibr" rid="B23">2021</xref>). Because fairness strongly depends on the context, making AI models fair means making them fair in a particular context, i.e., according to an appropriate definition of fairness (Srivastava et al., <xref ref-type="bibr" rid="B175">2019</xref>). Depending on their application level in the AI-lifecycle, &#x0201C;bias mitigation approaches&#x0201D; or &#x0201C;fairness enhancing methods&#x0201D;, are commonly grouped into three categories (Bellamy et al., <xref ref-type="bibr" rid="B27">2019</xref>; Pessach and Shmueli, <xref ref-type="bibr" rid="B147">2023</xref>; Barocas et al., <xref ref-type="bibr" rid="B24">2023</xref>):</p>
<list list-type="order">
<list-item><p><italic>Pre-processing</italic> concerns improving the training data&#x00027;s quality and balancing its composition in regard to protected groups. This can be applied independent of the AI algorithm. Pre-processing can regulate fairness in acceptance rates but does not cater to other fairness constraints. Examples of pre-processing algorithms include reweighting (Calders et al., <xref ref-type="bibr" rid="B45">2009</xref>), optimized preprocessing (Calmon et al., <xref ref-type="bibr" rid="B46">2017</xref>), learning fair representations (Zemel et al., <xref ref-type="bibr" rid="B205">2013</xref>), and disparate impact removal (Feldman et al., <xref ref-type="bibr" rid="B71">2015</xref>).</p></list-item>
<list-item><p><italic>In-processing</italic> describes the design and optimization of an AI algorithm toward an explicitly defined, fair solution. Thus, it incorporates fairness in the training algorithms themselves and can only be applied to specific algorithms/models that are well-understood (Srivastava et al., <xref ref-type="bibr" rid="B175">2019</xref>).</p></list-item>
<list-item><p><italic>Post-processing</italic> aims to adapt the AI model&#x00027;s results toward a balanced distribution for protected groups. Examples thereof include methods for calibration, constraint optimization, or setting thresholds for the maximum accuracy differences between groups (Pleiss et al., <xref ref-type="bibr" rid="B149">2017</xref>).</p></list-item>
</list>
<p>While each approach has its particular pros and cons, all of them potentially negatively affect the models&#x00027; accuracy (see Section 3.4).</p></sec>
<sec>
<title>3.2.3 Methods to evaluate fairness and non-discrimination</title>
<p>The auditing or evaluation of algorithmic fairness can, similar to the mitigation strategies, be approached according to the three main phases of the AI-lifecycle, i.e., design, development, and deployment (Koshiyama et al., <xref ref-type="bibr" rid="B103">2021</xref>). Examples of what can be assessed are (1) population balance and fair representation in data (design), (2) the implementation of fairness constraints in modeling or the adherence to fairness metrics in evaluation (development), and (3) the adherence to fairness metrics in real-time monitoring (deployment) (Akula and Garibay, <xref ref-type="bibr" rid="B6">2021</xref>).</p>
<p>Measures of algorithmic bias are a quantitative evaluation of the result set of the system at hand (Pessach and Shmueli, <xref ref-type="bibr" rid="B147">2023</xref>). The highest level of separation between different definitions of fairness is between individual and group fairness, which are related to the legal concepts of disparate treatment and disparate impact, respectively (Barocas and Selbst, <xref ref-type="bibr" rid="B25">2016</xref>).</p>
<list list-type="bullet">
<list-item><p><italic>Individual fairness</italic> considers fairness on an individual level and requires treating similar individuals similarly.</p></list-item>
<list-item><p><italic>Group fairness</italic> calculates fairness on a group level, requiring different groups to be treated equally.</p></list-item>
</list>
<p>Furthermore, one can differentiate between three principal approaches: fairness in acceptance rates, fairness in error rates, and fairness in outcome frequency (Barocas et al., <xref ref-type="bibr" rid="B23">2021</xref>). Verma and Julia (<xref ref-type="bibr" rid="B185">2018</xref>) provide an overview of the 20 most prominent definitions. One challenge, however, is selecting the &#x0201C;right&#x0201D; definition and metrics, as many different definitions of algorithmic fairness and related metrics exist. In many settings, these definitions contradict each other&#x02014;thus, it is usually not possible for an AI model to be fair in all three aspects. The appropriate metrics must be selected for a given application and its particularities. Several software packages are available that implement important metrics. Popular open-source frameworks include AIF 360 (Bellamy et al., <xref ref-type="bibr" rid="B27">2019</xref>), Fairlearn (Bird et al., <xref ref-type="bibr" rid="B32">2020</xref>), and Aequitas (Saleiro et al., <xref ref-type="bibr" rid="B159">2018</xref>).</p></sec>
<sec>
<title>3.2.4 Open issues and research challenges</title>
<p>Fairness is a highly context-dependent concept that, in practice, may require ethical consultation (John-Mathews, <xref ref-type="bibr" rid="B95">2022</xref>). No fairness definition applies to all contexts, and it seems an intrinsic&#x02014;and unsolvable&#x02014;challenge of the field to formulate legally compliant measurements mathematically (Wachter et al., <xref ref-type="bibr" rid="B186">2021</xref>). What is perceived as fair or unfair also varies between different cultural and legal settings. It remains unclear how to tune the fairness of an AI application intended to be used in multiple cultural or legal contexts (Srivastava et al., <xref ref-type="bibr" rid="B175">2019</xref>) and, more generally, how to apply and assess existing regulations, standards, and ethical constraints in practice (Costanza-Chock et al., <xref ref-type="bibr" rid="B54">2022</xref>).</p>
<p>From a more technical perspective, ensuring fairness when combining different AI components poses a significant challenge. This can be particularly difficult when reusing AI tools or algorithms with limited access to code, or when exchanging data audited only for a specific use case or application context. In fact, it has been shown that measures of algorithmic fairness are sensitive to any alterations in the input data and to even simple changes in train-test splits (Friedler et al., <xref ref-type="bibr" rid="B75">2019</xref>). In principle, monitoring fairness in AI systems that are in production is possible (e.g., Vasudevan and Kenthapadi, <xref ref-type="bibr" rid="B184">2020</xref>). However, it is still much more demanding to define when fairness criteria are met and when not because the algorithm&#x00027;s performance may change over time (e.g., Lazer et al., <xref ref-type="bibr" rid="B107">2014</xref>). The application of generative AI models presents additional challenges, especially in the context of language. Despite a significant body of research, it is still unclear how to effectively measure and evaluate their bias and how to transform these measurements to be suitable for application in various contexts or to consider different minority characteristics (Nemani et al., <xref ref-type="bibr" rid="B137">2023</xref>).</p>
<p>Finally, there is no standard to determine the adequate trade-off between different fairness metrics nor between fairness and accuracy. While there have been attempts to show that the fairness-accuracy trade-off is rather an issue of historical bias in data (Dutta et al., <xref ref-type="bibr" rid="B61">2020</xref>), it remains unclear how to generate an ideal, unbiased dataset as a standard in practice.</p></sec></sec>
<sec>
<title>3.3 Requirement 3: transparency and explainability</title>
<sec>
<title>3.3.1 Definition of transparency and explainability</title>
<p>Transparency and explainability are two related but distinct concepts. Explainability aims to enhance comprehension, build trust, and facilitate decision-making (Adadi and Berrada, <xref ref-type="bibr" rid="B2">2018</xref>). In contrast, the goal of transparency is to ensure understandability and accountability (Lepri et al., <xref ref-type="bibr" rid="B109">2018</xref>; Arias-Duart et al., <xref ref-type="bibr" rid="B15">2022</xref>; McDermid et al., <xref ref-type="bibr" rid="B119">2021</xref>). With transparent and explainable AI, users can better estimate the trustworthiness of AI systems since they can understand their inner workings and, consequently, their opportunities and limitations (Naiseh et al., <xref ref-type="bibr" rid="B135">2023</xref>). However, there is no final consensus on the definition and scope of transparency to date. Therefore, in this paper, we will focus on explainability as a means to achieve transparency in AI models.</p>
<p>Furthermore, including explainability methods in an AI system offers additional benefits, such as allowing for debugging and expert verification of the AI system, which can foster task accuracy and efficiency (Weber et al., <xref ref-type="bibr" rid="B191">2023</xref>) [e.g., in healthcare (Albahri et al., <xref ref-type="bibr" rid="B8">2023</xref>; Hulsen, <xref ref-type="bibr" rid="B94">2023</xref>)]. For example, Anders et al. (<xref ref-type="bibr" rid="B12">2022</xref>) improved a model&#x00027;s prediction accuracy by utilizing explainability methods to identify dataset samples that led the model to learn spurious correlations. Young et al. (<xref ref-type="bibr" rid="B203">2019</xref>) used explainable AI to help experts verify that models for melanoma detection relied on the correct data aspects for their predictions. Other researchers have developed explainability methods to facilitate iterative learning and improvement of AI models by identifying patterns, biases, or errors in the model&#x00027;s decision-making processes (Ribeiro et al., <xref ref-type="bibr" rid="B155">2016</xref>; Mehdiyev and Fettke, <xref ref-type="bibr" rid="B121">2021</xref>).</p></sec>
<sec>
<title>3.3.2 Methods to establish transparency and explainability</title>
<p>Methods to make AI systems explainable are often summarized under the umbrella term &#x0201C;Explainable AI (XAI)&#x0201D; (Holzinger et al., <xref ref-type="bibr" rid="B91">2022</xref>), and sometimes also interpretable AI (Molnar, <xref ref-type="bibr" rid="B124">2020</xref>). XAI aims to increase transparency and explainability in AI systems to ensure trust, understanding, and accountability. With respect to the AI-lifecycle (see Section 2), XAI is relevant in all three phases: in the design phase, for understanding and incorporating stakeholders&#x00027; explainability requirements; in the development phase, for understanding important data aspects, performing error analysis and model refinement; and finally, in the deployment phase for continuous model verification and enhancing user trust. XAI methods vary in their approach toward achieving these goals and can be categorized based on their <italic>scope</italic> and <italic>model dependence</italic>. The term <italic>scope</italic> refers to whether XAI methods can produce global or local explanations (Samek et al., <xref ref-type="bibr" rid="B161">2021</xref>). Global explanations aim to explain the AI model as a whole and, thus, provide insight into the model&#x00027;s general decision-making process, e.g., SHAP (Lundberg and Lee, <xref ref-type="bibr" rid="B117">2017</xref>). In contrast, local explanations focus on the model&#x00027;s decision-making process in regard to a single sample, making the explanation more specific [e.g., LIME (Ribeiro et al., <xref ref-type="bibr" rid="B155">2016</xref>)]. Global explanations tend to be computationally more expensive, as they need to consider the entire training input space, whereas local explanations might work on one input sample.</p>
<p>Furthermore, XAI methods can be classified as &#x0201C;model-agnostic&#x0201D; or &#x0201C;model-specific&#x0201D; methods (Arrieta et al., <xref ref-type="bibr" rid="B16">2020</xref>), according to their <italic>model dependence</italic>. Model-agnostic XAI methods can provide explainability and transparency for any AI system. In contrast, model-specific XAI methods are tailored to a single AI architecture, which may limit their compatibility with other AI systems. However, they tend to create more accurate and translucent (i.e., the extent to which the explanations rely on particularities of the inner workings of the AI system) explanations than model-agnostic methods (Carvalho et al., <xref ref-type="bibr" rid="B49">2019</xref>). Additionally, model-specific XAI methods cannot be implemented for every AI system. Meanwhile, model-agnostic XAI methods can be implemented on every AI system, as they often use the AI system as an oracle. They do so by probing the model many times to estimate the effects of the input on the model prediction, which can lead to expensive computations. Examples of model-agnostic XAI methods are SHAP (Lundberg and Lee, <xref ref-type="bibr" rid="B117">2017</xref>), LIME (Ribeiro et al., <xref ref-type="bibr" rid="B155">2016</xref>) and the broader category of counterfactual explanations (Guidotti, <xref ref-type="bibr" rid="B81">2022</xref>); model-specific XAI methods are DeepLIFT (Shrikumar et al., <xref ref-type="bibr" rid="B168">2017</xref>) and Integrated Gradients (Sundararajan et al., <xref ref-type="bibr" rid="B178">2017</xref>).</p>
<p>It is a common belief that &#x0201C;white-box&#x0201D; models&#x02014;models whose &#x0201C;inner workings&#x0201D; can be inspected&#x02014;are immediately interpretable and transparent. However, they often have lower prediction accuracy than more complex models (Moreira et al., <xref ref-type="bibr" rid="B127">2022</xref>). In addition, white-box models, e.g., Linear Regression and Decision Trees, often need extra steps to be used or treated as &#x0201C;full-fledged&#x0201D; XAI methods because in order to be most effective, XAI methods are required to be understandable and not overwhelming to their target users, meaning that they are specifically tailored to meet their requirements (Miller et al., <xref ref-type="bibr" rid="B123">2017</xref>). Social science research regards high-quality explanations as a form of conversation and proposes explanation theories like temporal causality, social constructivism, and attribution theory (Mendoza et al., <xref ref-type="bibr" rid="B122">2023</xref>).</p>
<p>Deep learning models have succeeded across various domains by utilizing computational units called neurons, ordered in sequential layers forming neural network (NN) models. NNs can autonomously learn meaningful internal features without manual feature engineering (LeCun et al., <xref ref-type="bibr" rid="B108">2015</xref>). Consequently, to train the models, we often use raw data directly or include all features, regardless of complexity (Roy et al., <xref ref-type="bibr" rid="B157">2015</xref>). However, while NNs map inputs directly to outcomes, they do not disclose how features are weighted in relation to the model&#x00027;s output (Zhao et al., <xref ref-type="bibr" rid="B207">2015</xref>).</p>
<p>XAI methods can provide explanations in many different ways. <italic>Feature attribution methods</italic> generate values for each input feature, highlighting its importance to the AI model&#x00027;s predictions. However, these methods can be sensitive to input noise and correlated features, resulting in misleading conclusions (Adebayo et al., <xref ref-type="bibr" rid="B3">2018</xref>). They are commonly presented textually (numerically), via bar charts (Ribeiro et al., <xref ref-type="bibr" rid="B155">2016</xref>), or via heatmaps (Sundararajan et al., <xref ref-type="bibr" rid="B178">2017</xref>). XAI methods can also provide explanations by visualizing the models&#x00027; internals, e.g., activation maps in Convolutional Neural Networks, which can quickly become too complex when dealing with many neurons (Carter et al., <xref ref-type="bibr" rid="B48">2019</xref>). <italic>Counterfactual explanations</italic> are a category of explanations that aims to answer the &#x0201C;why&#x0201D; question with &#x0201C;because if it was <italic>something different</italic>, it would be <italic>this other thing</italic> instead&#x0201D; (Guidotti, <xref ref-type="bibr" rid="B81">2022</xref>). Counterfactuals are typically computationally intensive, and generating meaningful counterfactual examples depends on the task context (Artelt and Hammer, <xref ref-type="bibr" rid="B17">2019</xref>).</p>
<p>Undoubtedly, explaining AI requires numerous considerations. Despite inherent limitations, each explanation technique enhances the explainability and transparency of AI systems, thereby advancing the overarching objective of fostering trustworthy and accountable AI applications. Many software libraries exist that make employing XAI methods straightforward. For Python, the libraries SHAP (Lundberg and Lee, <xref ref-type="bibr" rid="B117">2017</xref>), LIME (Ribeiro et al., <xref ref-type="bibr" rid="B155">2016</xref>), Captum (Kokhlikyan et al., <xref ref-type="bibr" rid="B102">2020</xref>), and scikit-learn (Pedregosa et al., <xref ref-type="bibr" rid="B145">2011</xref>) are widespread and cover most XAI method categories. The DALEX (Biecek, <xref ref-type="bibr" rid="B30">2018</xref>) library offers model-agnostic explanations for the programming language R.</p></sec>
<sec>
<title>3.3.3 Methods to evaluate transparency and explainability</title>
<p>Evaluating explanation methods is vital for assessing their correctness, efficacy, and practical utility. Various approaches for estimating the effectiveness and quality of explanations have been introduced and can be divided into the following categories (Doshi-Velez and Kim, <xref ref-type="bibr" rid="B58">2017</xref>):</p>
<list list-type="bullet">
<list-item><p><italic>Application-grounded evaluations</italic> that involve human participants performing realistic tasks and offer insights into how XAI methods work in real-world scenarios.</p></list-item>
<list-item><p><italic>Human-grounded evaluations</italic> that use simplified tasks for human participants to assess the comprehensibility and usefulness of explanations provided by the AI systems.</p></list-item>
<list-item><p><italic>Functionally-grounded evaluations</italic> that rely on proxy tasks without human involvement, focusing on XAI algorithms&#x00027; functionality and their scores against a pre-defined metric of interpretable quality.</p></list-item>
</list>
<p>While application and human-grounded approaches focus on the plausibility and usefulness of explanations to users, functionally-grounded evaluations estimate the <italic>correctness</italic> of XAI algorithms. Various properties of explanation methods can be examined to determine if they function correctly (Hedstr&#x000F6;m et al., <xref ref-type="bibr" rid="B87">2023</xref>). Some of these properties are:</p>
<list list-type="bullet">
<list-item><p><italic>Faithfulness</italic> (Alvarez-Melis and Jaakkola, <xref ref-type="bibr" rid="B11">2018b</xref>; Samek et al., <xref ref-type="bibr" rid="B160">2016</xref>; &#x00160;imi&#x00107; et al., <xref ref-type="bibr" rid="B169">2022</xref>) estimates how accurately explanation methods identify features in the input driving the model prediction.</p></list-item>
<list-item><p><italic>Robustness</italic> (Montavon et al., <xref ref-type="bibr" rid="B125">2018</xref>; Alvarez-Melis and Jaakkola, <xref ref-type="bibr" rid="B10">2018a</xref>) measures an explanation method&#x00027;s sensitivity to input perturbations.</p></list-item>
<list-item><p><italic>Localization</italic> (Selvaraju et al., <xref ref-type="bibr" rid="B165">2017</xref>; Fong and Vedaldi, <xref ref-type="bibr" rid="B74">2017</xref>) identifies if the explanation method focuses correctly on the desired regions of interest.</p></list-item>
<list-item><p><italic>Complexity</italic> (Bhatt et al., <xref ref-type="bibr" rid="B29">2020</xref>; Nguyen and Mart&#x000ED;nez, <xref ref-type="bibr" rid="B139">2020</xref>) measures the conciseness of explanations, where less complex explanations are deemed more interpretable than more complex ones.</p></list-item>
<list-item><p><italic>Randomization</italic> quantifies an explanation method&#x00027;s sensitivity to modifications of model parameters.</p></list-item>
<list-item><p><italic>Axioms</italic> (Adebayo et al., <xref ref-type="bibr" rid="B3">2018</xref>; Kindermans et al., <xref ref-type="bibr" rid="B100">2019</xref>) define criteria that an explanation method has to fulfill.</p></list-item>
</list>
<p>Hence, careful identification of evaluation aspects is necessary to address context-specific concerns, such as faithfulness, robustness, or comprehensibility. For a detailed overview of evaluation metrics for transparency and explainability, please also see Hulsen (<xref ref-type="bibr" rid="B94">2023</xref>), in which metrics such as simulatability, decomposability, coherence, or comprehensiveness are mentioned. Unfortunately, software libraries that offer metrics for validating explanation methods are scarce; among the few existing ones are Quantus (Hedstr&#x000F6;m et al., <xref ref-type="bibr" rid="B87">2023</xref>) and AI Explainability 360 (Arya et al., <xref ref-type="bibr" rid="B18">2019</xref>).</p></sec>
<sec>
<title>3.3.4 Open issues and research challenges</title>
<p>The requirement for transparency and explainability of AI faces several open challenges. First and foremost, the research community has yet to agree on a common, clear, and precise definition of transparency in AI systems; the lack of such a definition currently leads to ambiguity regarding what explanations should entail. For instance, properly calibrating AI explanations to instill the correct amount of trust in AI models is crucial but complex (Wang et al., <xref ref-type="bibr" rid="B189">2019</xref>), as it requires providing understandable insights without oversimplifying or overwhelming users and, at the same time, without over- or underselling the explained AI model&#x00027;s capabilities. Additionally, tailoring explanations for diverse user groups and individuals remains challenging, as different stakeholders require different explanations at varying levels of granularity and detail (Miller et al., <xref ref-type="bibr" rid="B123">2017</xref>; Mendoza et al., <xref ref-type="bibr" rid="B122">2023</xref>). Furthermore, the evaluation of transparency and explainability of AI models is challenging, and developing intuitive user interfaces for explanations poses a design challenge, requiring informative yet user-friendly interfaces that follow &#x0201C;XAI UI guidelines&#x0201D; (Liao et al., <xref ref-type="bibr" rid="B114">2020</xref>; Wolf, <xref ref-type="bibr" rid="B198">2019</xref>).</p>
<p>Finally, ensuring transparency and explainability in large language models and generative AI systems presents unique difficulties due to their complexity, and it is also unclear what their explanations should look like (Schneider, <xref ref-type="bibr" rid="B164">2024</xref>).</p></sec></sec>
<sec>
<title>3.4 Requirement 4: robustness and accuracy</title>
<sec>
<title>3.4.1 Definition of robustness and accuracy</title>
<p>Robustness and accuracy are key properties of any AI system, and ensuring them is an essential part of the AI model development. Robustness and accuracy&#x02014;in loose terms&#x02014;refer to how &#x0201C;adequate&#x0201D; or &#x0201C;correct&#x0201D; the outputs of an AI model are. In contrast to other requirements&#x02014;such as fairness or transparency&#x02014;sufficient robustness and accuracy are required for <italic>any</italic> AI model, independent of its specific purpose (Huber, <xref ref-type="bibr" rid="B93">2004</xref>).</p>
<p>AI training algorithms are typically designed for general problem settings (e.g., image-classification tasks). A specific AI model is then developed for a particular problem. In many problem settings, various models can be employed. However, in complex settings, identifying a suitable model becomes challenging, often requiring the application of a model despite uncertainties regarding its suitability. In such a case, it is important to use models that produce reasonable results even if they are used in settings they were originally not designed for. Under challenging conditions, some models may behave unpredictably and produce unstable outputs, whereas other models exhibit more constant behavior, and the quality of their outputs differs only slightly from the optimal setting. Clearly, it is preferable to use the latter class of models. More concretely, Huber (<xref ref-type="bibr" rid="B93">2004</xref>) outlines three key properties an AI model should ideally possess. The model should: (1) achieve optimal or near-optimal results if it is applied in exactly the setting it was designed for; (2) degrade the quality of the results only slightly if it is subject to small deviations from the assumed setting; (3) not trigger nonsensical or dangerous outputs if it is applied in settings with large deviations from the assumed setting. An AI model is considered <italic>robust</italic> if it meets properties (2) and (3), while property (1) is essential to ensure a sufficiently <italic>accurate</italic> model.</p>
<p>It is optimal to achieve high values in both accuracy and robustness, but this is rarely possible. Instead, there is typically a trade-off between robustness and accuracy. While some models are more robust and can be applied across different settings, they come at the cost of lower accuracy. For example, a face detection algorithm could have very high accuracy in a highly specific setting, e.g., fixed camera type, fixed angle, and fixed lighting conditions, but might fail as soon as one of those parameters changes. A different model, on the other hand, might show slightly lower accuracy but perform similarly in various settings, e.g., different camera types and lighting conditions.</p>
<p>Considering robustness and accuracy is crucial in all phases of the AI-lifecycle (see Section 2). In the design phase, it is important to make choices that do not compromise the accuracy of the model, for example, in the selection of appropriate training and testing data. The development phase is particularly essential, where one of the core tasks of every AI system development is to ensure these qualities. Finally, in the deployment phase, robustness and accuracy metrics need constant monitoring&#x02014;especially in the case of continuously changing systems&#x02014;to ensure a well-working AI model (Hamon et al., <xref ref-type="bibr" rid="B84">2020</xref>).</p></sec>
<sec>
<title>3.4.2 Methods to establish robustness and accuracy</title>
<p>Ensuring accuracy is the core of AI model development and part of all best practices. Additional core considerations are the appropriate choice of (1) target metrics the model is trained on, (2) data splitting techniques (e.g., train-test-splits), and (3) model selection methods. These three points are part of AI model developments that, in practice, are often done properly but not documented in a sufficient manner. To generate trust in AI models, it is essential to both deliver quality and document all relevant choices made in the process. These include, for example, the choice of suitable evaluation metrics, i.e., not only is it necessary to document the choice (e.g., &#x0201C;F1-score&#x0201D;), but also the reasoning for that choice (e.g., &#x0201C;classification problem with unbalanced data&#x0201D;) (Huber, <xref ref-type="bibr" rid="B93">2004</xref>; Hamon et al., <xref ref-type="bibr" rid="B84">2020</xref>).</p>
<p>Ensuring robustness can be done in two principal ways: (1) by restricting potential models to model types shown to be more robust (e.g., multilinear regression is generally more robust than deep learning), or (2) by explicitly evaluating model robustness and incorporating it in the model selection process. In the process of model selection, certain model types can be adapted to increase robustness. For example, fragile models can improve robustness by introducing mechanics that ignore certain data points or limit their effect, e.g., a drop-out layer in neural networks (Krizhevsky et al., <xref ref-type="bibr" rid="B106">2012</xref>), or thresholds (Kim and Scott, <xref ref-type="bibr" rid="B99">2012</xref>). This has the advantage that the model learns to rely less on specific data points and focus more on the general information depicted in the majority of the data. However, &#x0201C;reserved&#x0201D; data usage has a cost: The model has less data to work with, which puts it at a statistical disadvantage compared to fragile models that use all data. This cost is particularly high when the model is used in a setting where accuracy is more important than robustness (Fisher, <xref ref-type="bibr" rid="B72">1922</xref>).</p></sec>
<sec>
<title>3.4.3 Methods to evaluate robustness and accuracy</title>
<p>In the AI literature, there are many different forms of robustness, e.g., robustness to domain shift (Blanchard et al., <xref ref-type="bibr" rid="B35">2011</xref>; Muandet et al., <xref ref-type="bibr" rid="B129">2013</xref>; Gulrajani and Lopez-Paz, <xref ref-type="bibr" rid="B82">2020</xref>), adversarial robustness (Nicolae et al., <xref ref-type="bibr" rid="B140">2019</xref>; Xu et al., <xref ref-type="bibr" rid="B200">2020</xref>), robustness to noise (Zhu and Wu, <xref ref-type="bibr" rid="B208">2004</xref>; Garcia et al., <xref ref-type="bibr" rid="B79">2015</xref>), robustness to non-adversarial perturbations (Hendrycks and Dietterich, <xref ref-type="bibr" rid="B88">2019</xref>; Rusak et al., <xref ref-type="bibr" rid="B158">2020</xref>; Scher and Tr&#x000FC;gler, <xref ref-type="bibr" rid="B163">2023</xref>), and others. While some generic robustness scores have been proposed (Weng et al., <xref ref-type="bibr" rid="B194">2018</xref>; Sharma et al., <xref ref-type="bibr" rid="B167">2020</xref>), they do, in fact, only measure specific types of adversarial robustness. Therefore, there is no single unified notion of robustness. Accordingly, as with most other aspects of trustworthy AI, the type of robustness to be considered depends on the context.</p>
<p>Accuracy can be measured with a wide variety of metrics. In technical terms, accuracy is simply the fraction of correct outputs of an AI model (Naidu et al., <xref ref-type="bibr" rid="B134">2023</xref>). The goal of measuring accuracy is to measure how &#x0201C;good&#x0201D; or &#x0201C;correct&#x0201D; the outputs of the AI model are. How &#x0201C;good&#x0201D; or &#x0201C;correct&#x0201D; is defined in practice highly depends on the application at hand. Therefore, there is no single generally applicable accuracy metric. The choice of which metric or metrics are applicable depends on the type of problem the AI model attempts to solve (e.g., regression, classification, ranking, translation), and on the particular properties of the application. For instance, for classification tasks with balanced classes, accuracy is a useful metric. However, for classification tasks with highly imbalanced data, accuracy can be misleading, and metrics such as precision and recall are more appropriate. Regression tasks require very different evaluation metrics than classification tasks. Examples are root-mean-square error or mean absolute error. Which one is more appropriate again depends on the application at hand. The same holds for ranking tasks, which require yet other types of metrics (such as mean reciprocal rank or mean average precision). An overview of these commonly used metrics can be found in Poretschkin et al. (<xref ref-type="bibr" rid="B150">2023</xref>).</p></sec>
<sec>
<title>3.4.4 Open issues and research challenges</title>
<p>The ongoing surge in generative AI models has opened a new challenge for existing models with respect to accuracy and robustness. It has been shown that generative models are, to a certain extent, capable of producing adversarial examples that cause catastrophic outputs in existing fragile AI models (Han et al., <xref ref-type="bibr" rid="B85">2023</xref>). Moreover, some of these examples are transferable from one system to the next and can be re-used to cause failure in a number of different AI systems (Wang Z. et al., <xref ref-type="bibr" rid="B190">2023</xref>). Currently, there is no widely applicable easy strategy to address these issues. Existing fragile models need to be replaced with more robust models, and higher accuracy needs to be established for robust models, which are currently not able to compete with their fragile counterparts.</p>
<p>Providing accuracy is the core of machine learning and AI, and thus, methods ensuring AI applications are accurate need to be integrated with the development and improvement of the models. Accuracy evaluation metrics are well-established in statistics and machine learning, and their computation is generally straightforward. However, the choice of a proper metric and the definition of its thresholds are much more complex. While best practices exist, no formal guidelines are available. Also, despite a wide range of established accuracy metrics, there is a need for additional, new accuracy metrics that are specifically developed and tailored to the particularities of distinct applications (Naidu et al., <xref ref-type="bibr" rid="B134">2023</xref>)&#x02014;and perhaps also tailored to permit robust solutions.</p>
<p>The field of robustness faces a variety of open issues and limitations. Robustness is a broad concept that current research strands do not necessarily cover in all aspects. In part, no specific methods&#x02014;besides best-practice examples&#x02014;are available for increasing robustness (e.g., robustness against noise). In particular, the problem of adversarial attacks constitutes a &#x0201C;cat and mouse game&#x0201D;: if a specific attack strategy is known, AI systems can be made robust against it by incorporating the attack in the training procedure&#x02014;known as adversarial training. However, this does not guarantee robustness toward a new attack that has not yet been part of the training. Another open issue is caused by composite systems, where multiple AI components are combined or in situations where AI evaluation is part of a larger product/solution. Moreover, it remains unanswered how to assess accuracy and robustness in evolving (learning) AI systems that are constantly updated (in some cases with every single user interaction) (Hamon et al., <xref ref-type="bibr" rid="B84">2020</xref>). In general, data quality, as well as model training and selection, are very important for AI systems, as these aspects influence accuracy and robustness, among other qualities such as fairness. Nonetheless, currently, no unified quality concept is available, even though basic automated tests are feasible.</p></sec></sec>
<sec>
<title>3.5 Requirement 5: privacy and security</title>
<sec>
<title>3.5.1 Definition of privacy and security</title>
<p>Privacy and security are indispensable pillars supporting the trustworthiness and ethical use of AI systems. Privacy refers to the data used as input for the AI model and to protecting information that belongs to the data owner. This information must not be disclosed to any third parties and may only be disclosed to parties that the data owner defines. Security, on the other hand, pertains to the AI model itself and is linked to defending it against any malicious attacks that aim to impact or manipulate it in an undesired or harmful way. Both privacy and security risks can arise along the whole life cycle of AI systems (see Section 2). Existing countermeasures span a broad spectrum, encompassing methods from manipulating the input data of AI models for ensuring privacy and security and designing AI models that are by themselves private and secure to recent advances that allow the protection of AI models during the inference process, i.e., during deployment (Elliott and Soifer, <xref ref-type="bibr" rid="B64">2022</xref>).</p>
<p>If AI is utilized in critical areas such as healthcare, autonomous vehicles, or national security, it may even endanger human safety. Incidents like the unintended memorization of sensitive information by large language models<xref ref-type="fn" rid="fn0004"><sup>4</sup></xref> highlight the tangible privacy and security risks associated with AI. These examples serve as a reminder of AI models&#x00027; potential to compromise privacy and security inadvertently. In response, regulatory bodies, particularly in the European Union, have been proactive in updating legal frameworks to address these challenges: The General Data Protection Regulation (GDPR) and the AI Act are prime examples of such regulatory efforts, aiming to establish clear guidelines for AI design, development, and deployment (Zaeem and Barber, <xref ref-type="bibr" rid="B204">2020</xref>).</p></sec>
<sec>
<title>3.5.2 Methods to establish privacy and security</title>
<p>Understanding the weaknesses of AI systems and identifying the diverse kinds of attacks on privacy and security is critical for developing defense strategies and, consequently, evaluating their effectiveness. Attacks can be classified based on several aspects, including the attacker&#x00027;s capabilities and the attack goal. For example, attackers can deviate from the agreed protocol (active/malicious) or try to learn as much as possible without violating the protocol (passive/semi-honest/honest-but-curious). Moreover, an attacker may be assumed to have finite or infinite computational power. Based on the attacker&#x00027;s knowledge, one can differentiate between black-box attacks (which only access the model&#x00027;s output), white-box attacks (which access the full model), and gray-box attacks (which gain partial access). In the following, we classify attacks based on the attack goal, i.e., evasion attacks, poisoning and backdoor attacks, and privacy attacks (BSI, <xref ref-type="bibr" rid="B41">2022</xref>; Bae et al., <xref ref-type="bibr" rid="B19">2018</xref>):</p>
<list list-type="order">
<list-item><p><italic>Evasion attacks</italic> (including adversarial attacks) aim to mislead AI models through carefully crafted inputs, forcing incorrect predictions.</p></list-item>
<list-item><p><italic>Poisoning attacks</italic> corrupt the training process, while <italic>backdoor attacks</italic> insert hidden triggers into models.</p></list-item>
<list-item><p><italic>Privacy attacks</italic> seek to extract sensitive information from AI models. The most common privacy attacks include:</p></list-item></list>
<list list-type="bullet">
<list-item><p>Membership inference attacks aim to determine whether a specific data sample was used in the training phase of the AI model.</p></list-item>
<list-item><p>Attribute inference attacks aim to infer sensitive attributes, e.g., the gender of individual records.</p></list-item>
<list-item><p>Model inversion attacks aim to infer features that characterize classes from the training data.</p></list-item>
<list-item><p>Model extraction and stealing attacks aim to reconstruct the model&#x00027;s behavior, architecture, and/or parameters.</p></list-item>
</list>
<p>Adilova et al. (<xref ref-type="bibr" rid="B4">2022</xref>) list best practices to defend against the aforementioned attacks. In the following, we briefly provide examples for each class of attacks. Countermeasures against <italic>evasion attacks</italic> include: (1) certification or verification of output bounds, i.e., utilizing certification methods to calculate guarantees on the output distribution to certify the AI model&#x00027;s robustness, (2) adversarial retraining, i.e., incorporating perturbed samples into the training process, (3) injection of randomness into training, i.e., using random transformations to protect against attacks, (4) use of more training data, i.e., enhancing adversarial robustness with larger and more diverse training datasets, (5) multi-objective optimization, i.e., not only optimizing for accuracy but balancing between adversarial robustness and task-specific accuracy, and (6) attack detection, i.e., implementing detection methods for malicious inputs. The risk of <italic>backdoor and poisoning attacks</italic> can effectively be mitigated by the following strategies: (1) use of trusted sources, i.e., ensuring reliability and trustworthiness of data models; (2) random data augmentation, i.e., employing data augmentation techniques to mitigate the effect of poisoned samples; (3) use of an auxiliary pristine dataset, i.e., supporting training with trusted data to dilute the impact of poisoned samples; (4) attack detection, i.e., applying techniques to identify poisoned samples or models, including analysis of data distributions and model inspections; (5) model cleaning, i.e., utilizing methods like pruning, retraining, or differential privacy to eliminate the influence of triggers or poisoned data; and (6) adversarial training, i.e., adapting adversarial training approaches to counter poisoning attacks, enhancing model resilience.</p>
<p>Overall, defending the security of AI models against a variety of attacks involves a multifaceted approach that combines diverse techniques and practices, highlighting the need for AI practitioners to continuously assess and update their defense strategies. Similarly, the development of privacy-enhancing technologies (PETs) has been instrumental in protecting AI models from <italic>privacy attacks</italic>. The following (non-exhaustive) list of PETs details the most important technologies, which currently form the forefront of research in private and secure AI computations.</p>
<list list-type="bullet">
<list-item><p><italic>Homomorphic encryption (HE)</italic> (Gentry, <xref ref-type="bibr" rid="B80">2009</xref>; Rechberger and Walch, <xref ref-type="bibr" rid="B153">2022</xref>; Smart, <xref ref-type="bibr" rid="B172">2016</xref>; Phong et al., <xref ref-type="bibr" rid="B148">2018</xref>) supports the performing of certain operations on encrypted data (i.e., without decrypting it). This allows privacy in cloud-based AI services to be maintained without exposing private data or model details. However, HE requires substantial computational resources and entails high computational costs.</p></list-item>
<list-item><p><italic>Secure multi-party computation (MPC)</italic> (Rechberger and Walch, <xref ref-type="bibr" rid="B153">2022</xref>; Evans et al., <xref ref-type="bibr" rid="B68">2018</xref>) allows collaborative computation without revealing individual inputs. In the context of AI, MPC is especially useful for collaborative learning and private classification, though it requires significant communication overhead for many participants.</p></list-item>
<list-item><p><italic>Differential privacy (DP)</italic> (Dwork, <xref ref-type="bibr" rid="B62">2008</xref>; Dwork and Roth, <xref ref-type="bibr" rid="B63">2014</xref>) bounds the maximum amount of information that an AI model&#x00027;s output discloses about an individual data point by incorporating curated noise into the computation. Specifically, noise can be added either to the input data, during the training process, or to the output (Friedman et al., <xref ref-type="bibr" rid="B76">2016</xref>). While effective in various AI applications, including deep learning (Abadi et al., <xref ref-type="bibr" rid="B1">2016</xref>) and recommender systems (M&#x000FC;llner et al., <xref ref-type="bibr" rid="B131">2023</xref>), DP&#x00027;s main challenge is the trade-off between privacy protection and accuracy.</p></list-item>
<list-item><p><italic>Federated learning (FL)</italic> (Zhang et al., <xref ref-type="bibr" rid="B206">2021</xref>; Li et al., <xref ref-type="bibr" rid="B112">2020</xref>) is a machine learning approach that allows multiple clients, like mobile phones, to collaboratively learn a model by training locally and sharing updates with a central server. This method enhances privacy by keeping data local, although there is a risk of data reconstruction from model updates (Yin et al., <xref ref-type="bibr" rid="B202">2021</xref>; Nasr et al., <xref ref-type="bibr" rid="B136">2019</xref>; Ren et al., <xref ref-type="bibr" rid="B154">2022</xref>).</p></list-item>
<list-item><p><italic>Synthetic data</italic> (Slokom, <xref ref-type="bibr" rid="B171">2018</xref>; Liu et al., <xref ref-type="bibr" rid="B115">2022</xref>) mimics real data&#x00027;s statistical features to enable the AI model to still learn the real data&#x00027;s features, but without using the real data. This offers a way to preserve privacy in data sharing, yet it is not immune to reconstruction risks (Stadler et al., <xref ref-type="bibr" rid="B176">2022</xref>).</p></list-item>
<list-item><p><italic>Transfer learning</italic> (Zhuang et al., <xref ref-type="bibr" rid="B209">2020</xref>), while not a PET <italic>per se</italic>, contributes to privacy by fine-tuning pre-trained models on new tasks with minimal data, reducing the need for large private datasets (Gao et al., <xref ref-type="bibr" rid="B78">2019</xref>). Similar ideas are also employed by PETs based on meta-learning (Muellner et al., <xref ref-type="bibr" rid="B130">2021</xref>).</p></list-item>
</list>
<p>The described defense methods can also be combined to increase privacy and security. For example, DP can mitigate the risk of reconstruction in FL (Wei et al., <xref ref-type="bibr" rid="B192">2020</xref>) and synthetic data (Tai et al., <xref ref-type="bibr" rid="B180">2022</xref>; Stadler et al., <xref ref-type="bibr" rid="B176">2022</xref>).</p></sec>
<sec>
<title>3.5.3 Methods to evaluate privacy and security</title>
<p>The vulnerability of AI models to privacy and security attacks can be assessed using two complementary approaches: mathematical analysis and attack-based evaluation. <italic>Mathematical analysis</italic> offers formal proofs of privacy and security features within a system, much like cryptography, guaranteeing system security under certain assumptions (e.g., DP). This method is crucial, especially when introducing new privacy or security techniques, as it requires thorough checks for implementation errors and the appropriate selection of parameters. On the other hand, <italic>attack-based evaluation</italic> gives us practical insight into how an AI model reacts to various attack strategies. This method tests the model&#x00027;s vulnerability to different attacks and determines its resilience by using various metrics (Wagner and Eckhoff, <xref ref-type="bibr" rid="B187">2018</xref>; Pendleton et al., <xref ref-type="bibr" rid="B146">2016</xref>). These metrics might include the attacks&#x00027; success rate, the effort required to breach the model (measured in iterations), the precision of the attack, and the smallest necessary data alterations to compromise the model successfully (BSI, <xref ref-type="bibr" rid="B41">2022</xref>). The choice of metrics depends on the nature of the attack and on assumptions about the attacker&#x00027;s skills and knowledge. It is tailored to each specific scenario and model based on potential threats and existing literature. However, it is important to acknowledge the limitations of attack-based evaluations. While they can pinpoint specific weaknesses and vulnerabilities, they do not offer a comprehensive guarantee of privacy or security. Additionally, these evaluations only cover known attack scenarios, leaving the potential for undetected vulnerabilities against new or complex attack techniques.</p></sec>
<sec>
<title>3.5.4 Open issues and research challenges</title>
<p>Despite the existing countermeasures, the AI privacy and security field still faces numerous unresolved challenges. Many defense strategies cannot fully mitigate the models&#x00027; vulnerability to attacks, especially not to adversarial and poisoning attacks. Additional challenges emerge with the increasing advancement of generative AI, particularly in models that rely heavily on unstructured data such as text. For example, establishing clear boundaries on what constitutes private information becomes increasingly difficult due to the inherent complexities of unstructured data (Brown et al., <xref ref-type="bibr" rid="B40">2022</xref>). PETs often introduce trade-offs, such as increased computational demands (HE and MPC) (Moore et al., <xref ref-type="bibr" rid="B126">2014</xref>), reduced prediction accuracy and increased unfairness (DP) (Abadi et al., <xref ref-type="bibr" rid="B1">2016</xref>; Bagdasaryan et al., <xref ref-type="bibr" rid="B21">2019</xref>; M&#x000FC;llner et al., <xref ref-type="bibr" rid="B132">2024</xref>), or a surge in communication overhead while having no privacy guarantees (FL) (Almanifi et al., <xref ref-type="bibr" rid="B9">2023</xref>; Bagdasaryan et al., <xref ref-type="bibr" rid="B22">2020</xref>). Therefore, integrating PETs smoothly into AI systems without compromising performance remains complex and requires further research. Just as for fairness and robustness, evaluating privacy and security when combining multiple AI components is challenging. Adding components that protect against one identified risk can even introduce new vulnerabilities (Debenedetti et al., <xref ref-type="bibr" rid="B55">2023</xref>).</p>
<p>In general, fostering secure model sharing and privacy-preserving collaboration, developing standardized evaluation metrics, and preparing for advanced AI threats necessitate a collaborative approach among researchers, developers, and policymakers. Ongoing research and shared best practices will be crucial for building a secure, privacy-conscious AI ecosystem.</p></sec></sec>
<sec>
<title>3.6 Requirement 6: accountability</title>
<sec>
<title>3.6.1 Definition of accountability</title>
<p>Another key requirement for trustworthy AI is accountability. At its heart, accountability is the obligation to notify an authority of one&#x00027;s conduct and to justify it (Bovens, <xref ref-type="bibr" rid="B36">2007</xref>; Brandsma and Schillemans, <xref ref-type="bibr" rid="B38">2012</xref>; Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>; Hauer et al., <xref ref-type="bibr" rid="B86">2023</xref>; Wieringa, <xref ref-type="bibr" rid="B195">2020</xref>), whereas responsibility includes explicit obligations defined in advance (Bivins, <xref ref-type="bibr" rid="B34">2006</xref>) and can be seen as a subcategory of accountability (Gabriel et al., <xref ref-type="bibr" rid="B77">2021</xref>). Liability is closely related to accountability and means legal responsibility, including sanctions for misbehavior. In this article, we, therefore, see liability as a sub-concept of accountability and solely use the term accountability.</p>
<p>From a conceptual perspective, accountability can also be defined as a virtue or as a mechanism (Bovens, <xref ref-type="bibr" rid="B37">2010</xref>). Accountability &#x0201C;refers to the idea that one is responsible for their action&#x02014;and as a corollary their consequences&#x02014;and must be able to explain their aims, motivations, and reasons&#x0201D;.<xref ref-type="fn" rid="fn0005"><sup>5</sup></xref></p>
<p>The definition of Bovens (<xref ref-type="bibr" rid="B36">2007</xref>) is widely used as the basis for addressing accountability and identifies the following key elements of accountability: actor, forum, relationship between these two, account, and consequences. The actors, as natural persons, groups or organizations (e.g., developers, deployers, manufacturers, or users of AI systems), shall be able to explain their actions (e.g., used models and data, intended use, planned outcomes, and potential malfunctions of AI systems) by certain criteria to the forum (e.g., a court, a supervisor, an auditor), that can &#x0201C;pose questions and pass judgments&#x0201D;. The relationship between actor and forum can vary and involves individual, hierarchical, collective and corporate accountability. Finally, there will be consequences (e.g., fines for non-compliance with rules).</p></sec>
<sec>
<title>3.6.2 Methods to establish accountability</title>
<p>When addressing accountability, features such as context, the range of actions taken, the acting entity, the forum as the bearer of interests and imposed standards, processes, and implications must be considered (Bovens, <xref ref-type="bibr" rid="B36">2007</xref>) to be able to achieve compliance, report, oversight, and enforcement (Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>). Thus, accountability is always relational (Bovens, <xref ref-type="bibr" rid="B36">2007</xref>), contextual (Lewis et al., <xref ref-type="bibr" rid="B110">2020</xref>) and involves single persons, other entities, as well as groups and societies. Depending on impacts, different levels of accountability are required (Cech, <xref ref-type="bibr" rid="B50">2021</xref>).</p>
<p>Accountability systems range from hard law regulations over functional roles within organizations (Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>) to social norms that, in turn, form the basis for decision-making and behavior (Gabriel et al., <xref ref-type="bibr" rid="B77">2021</xref>). In the field of software development, responsibility involves maintaining quality in the design process (Eriks&#x000E9;n, <xref ref-type="bibr" rid="B67">2002</xref>), implementing tools for characterizing system failure (Nushi et al., <xref ref-type="bibr" rid="B143">2018</xref>), as well as using transparency and inspection mechanisms (Hauer et al., <xref ref-type="bibr" rid="B86">2023</xref>). So-called &#x0201C;algorithmic accountability&#x0201D; is also described as the expectation that people along the AI-lifecycle (see Section 2) will comply with legislation and standards to ensure the proper and safe use of AI and involves not only the use, design, implementation, and consequences but the whole &#x0201C;socio-technical process&#x0201D; (Hauer et al., <xref ref-type="bibr" rid="B86">2023</xref>; Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>; Wieringa, <xref ref-type="bibr" rid="B195">2020</xref>). Thus, accountability shall ensure compliance with requirements such as fairness, transparency, and robustness (Durante and Floridi, <xref ref-type="bibr" rid="B60">2022</xref>; Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>). Therefore, it also requires that mechanisms for auditability, minimization, and reporting of negative impacts, trade-offs, and redress are in place. Consequently, accountability must be ensured along the whole AI-lifecycle&#x02014;in the design phase, the development phase, and the deployment phase.</p></sec>
<sec>
<title>3.6.3 Methods to evaluate accountability</title>
<p>Due to the versatility of accountability, its evaluation is challenging. Numerous approaches for evaluating accountability regarding AI systems have been put forth.<xref ref-type="fn" rid="fn0006"><sup>6</sup></xref> For example, Tagiou et al. (<xref ref-type="bibr" rid="B179">2019</xref>) suggest &#x0201C;a tool-supported framework for the assessment of algorithmic accountability&#x0201D; that focuses on both algorithmic and organizational aspects and Cech (<xref ref-type="bibr" rid="B50">2021</xref>) proposes the &#x0201C;<italic>Accountability Agency Framework (A3)</italic>&#x0201D; as an analytic lens, that is, a qualitative, explorative, and complementary tool to assess algorithmic accountability, which is based on Bovens (<xref ref-type="bibr" rid="B36">2007</xref>)&#x00027;s definition of accountability. This framework encompasses four steps: requesting information, providing account, imposing consequences, and effective change. Additionally, it provides a series of guiding questions for assessing algorithmic accountability (Cech, <xref ref-type="bibr" rid="B50">2021</xref>). Xia et al. (<xref ref-type="bibr" rid="B199">2024</xref>) proposed a granular AI Metrics catalog that includes process, resource, and product metrics and is specially designed for generative AI. Besides, numerous other, mainly contextualized frameworks, which range from accountability in organizations (Buhmann and Christian, <xref ref-type="bibr" rid="B42">2019</xref>), public reason (Binns, <xref ref-type="bibr" rid="B31">2018</xref>) and public service (Brown et al., <xref ref-type="bibr" rid="B39">2019</xref>) to &#x0201C;AI robots accountability&#x0201D; (Toth et al., <xref ref-type="bibr" rid="B182">2022</xref>) frameworks have been proposed. From a qualitative perspective, approaches that, for instance, take human rights into account are discussed (McGregor et al., <xref ref-type="bibr" rid="B120">2019</xref>).</p>
<p>In general, Brandsma and Schillemans (<xref ref-type="bibr" rid="B38">2012</xref>) suggest a so-called &#x0201C;<italic>accountability cube</italic>&#x0201D; as a quantitative assessment tool for assessing accountability, considering three dimensions of accountability processes: information, discussion, and consequences/sanctions. Accordingly, accountability is &#x0201C;high&#x0201D; if there is much information, intensive discussions, and several opportunities to impose consequences. This approach can be applied in various contexts along the AI-lifecycle. Without any closer examination of the approach itself, we use the accountability cube to exemplify possible evaluation criteria of algorithmic accountability.</p>
<p>To start with, much information is given if people are aware of basic technical outlines, chances, and risks of AI in the respective context and know their obligations along the lifecycle of AI, including, for instance, information, documentation, and risk-assessment obligations. From our point of view, AI literacy is essential to this. Discussion is intensive if an informed exchange of views on AI systems and regulation&#x02014;whether formal or informal&#x02014;takes place between multiple stakeholders (e.g., policymakers, NGOs, technical experts, civil society, as well as companies and individuals). Besides, there shall be meaningful opportunities to explain actions (e.g., using certain design concepts/training data or using AI systems in certain situations). Finally, effective and proportionate consequences (e.g., penalties for non-compliance with rules and effective redress) shall be in scope. This, in turn, creates a need for clear and feasible rules.</p>
<p>Notably, the weight of these principles can vary. To exemplify, the &#x0201C;accountability rate&#x0201D; might still be high if there are clear non-binding standards with no legal consequences that are widely adhered to, whereas it is lower if there are binding rules that are not being followed due to societal rejection or inefficient enforcement. The weight of the principles might also vary in different contexts. For instance, in policymaking, intensive discussion might have a higher priority than in company-internal processes.</p></sec>
<sec>
<title>3.6.4 Open issues and research challenges</title>
<p>In practice, evaluating algorithmic accountability poses severe problems. One of the biggest challenges is that algorithmic accountability is a &#x0201C;multifaceted and context-sensitive challenge&#x0201D; (Cech, <xref ref-type="bibr" rid="B50">2021</xref>). At present, standards, standardized methods, and metrics covering different aspects of the AI-lifecycle, from design to deployment, are still incomplete and, therefore, do not provide sufficient legal security. Vague terms confront norm addressees with legal uncertainty when interpreting these norms. In turn, organizations are unable to implement sufficient accountability mechanisms within their organization.</p>
<p>On the one hand, accountability gaps arise if rules are inconsistent, unclear, or not feasible, and therefore, they lead to ineffective redress of victims. On the other hand, rules which are too strict generate accountability surpluses, which in turn decrease technological and economic growth (Bovens, <xref ref-type="bibr" rid="B36">2007</xref>; Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>). AI policymakers aim to close these accountability gaps that might arise due to the unpredictable, opaque nature of AI systems (Novelli et al., <xref ref-type="bibr" rid="B141">2023</xref>; Busuioc, <xref ref-type="bibr" rid="B44">2020</xref>). Several measures, like model certification, algorithmic impact assessments, real-world testing, and third-party audits, could foster accountability (Busuioc, <xref ref-type="bibr" rid="B44">2020</xref>). Such measures are also included in the AI Act. For example, there are documentation, information, and transparency obligations for providers of high-risk AI systems, there are third-party checks, and testing in real-world laboratories is enabled. Rules are also amendable according to technical changes, demonstrating effective change if needed.</p>
<p>Notably, developing sufficient rules, including ethical and technical standards, that cover the whole AI-lifecycle is challenging, as AI systems are complex, are based on various programming methods, develop rapidly, and can have wide-ranging effects on people (Cech, <xref ref-type="bibr" rid="B50">2021</xref>). Generative AI systems seem to exacerbate this problem due to their large scale, complexity, and adaptability (Xia et al., <xref ref-type="bibr" rid="B199">2024</xref>). Consequently, it is particularly difficult to find suitable metrics for evaluating the trustworthiness of generative AI. To ensure &#x0201C;actionable&#x0201D; accountability, both technical and non-technical aspects, among them legal and ethical aspects, must be considered (Stix, <xref ref-type="bibr" rid="B177">2021</xref>). When creating rules and standards on AI, it is crucial to weigh up technical and economic aspects. An informed dialogue between policymakers, (technical) experts, and civil society is essential to reaching sufficient rules and avoiding unnecessary bureaucracy.</p></sec></sec></sec>
<sec id="s4">
<title>4 Conclusion and future research</title>
<p>In this paper, we investigated the following six requirements of trustworthy AI: (1) human agency and oversight, (2) fairness and non-discrimination, (3) transparency and explainability, (4) robustness and accuracy, (5) privacy and security, and (6) accountability. With respect to our guiding research question introduced in Section 1 (i.e., <italic>What is the current state of research regarding the establishment and evaluation of comprehensive&#x02014;technical, human-centered, and legal&#x02014;requirements of trustworthy AI?</italic>), our findings confirm that ensuring AI systems meet these criteria is a complex endeavor requiring technical solutions, policy frameworks, and interdisciplinary collaboration. Additionally, our article demonstrates that while evaluation and validation methodologies for technical requirements, such as robustness, can often rely on well-established metrics and testing procedures (e.g., model accuracy), assessing human-centric considerations demands more nuanced approaches that take into account ethical, legal, and cultural factors. Therefore, we believe that our article complements existing surveys and assessment lists [e.g., ALTAI (Ala-Pietil&#x000E4; et al., <xref ref-type="bibr" rid="B7">2020</xref>; Radclyffe et al., <xref ref-type="bibr" rid="B151">2023</xref>)] of trustworthy AI.</p>
<p>This section further synthesizes our key observations across these very different aspects of AI systems in relation to their trustworthiness and discusses the implications of this overarching analysis. Additionally, <xref ref-type="fig" rid="F4">Figure 4</xref> visualizes these overarching research challenges in relation to the phases of the AI-lifecycle mentioned in Section 2.</p><list list-type="bullet">
<list-item><p><bold>Interdisciplinary research</bold>. The interdisciplinary nature of trustworthy AI research becomes apparent when considering the different scientific foundations necessary to discuss the design, development, and deployment of trustworthy AI. This demand for interdisciplinarity is also recognized by initiatives like the human-centered AI (HCAI) workshops and sessions at AI conferences such as NeurIPS,<xref ref-type="fn" rid="fn0007"><sup>7</sup></xref> as well as the FAccT community&#x00027;s work on fairness, accountability, and transparency in AI.<xref ref-type="fn" rid="fn0008"><sup>8</sup></xref> However, broader collaboration is needed. In particular, insights from social scientists, ethicists, and policymakers can complement technical research, for example, in fairness definitions, explainability, or human oversight. At the same time, interdisciplinary research comes with its own challenges, such as distinct discipline-specific jargon. Thus, agreeing on standardized, cross-disciplinary terminology remains an ongoing challenge in various subjects.</p></list-item>
<list-item><p><bold>Conceptual clarity and interdependencies</bold>. Across all trustworthy AI requirements, we see the need to sharpen definitions and to consider interdependencies and relationships between concepts. This involves understanding the potential trade-offs between requirements, such as fairness and accuracy or explainability and privacy. Such conceptual clarity and knowledge of interdependencies will help in designing trustworthy AI with regard to specific requirements while allowing for informed discussions of trade-offs. Therefore, it is essential to consider potential trade-offs and interdependencies already when designing trustworthy AI systems.</p></list-item>
<list-item><p><bold>Context-dependency of trustworthiness</bold>. Our research indicates that AI requirements are very context-dependent. This means that any insights for developing trustworthy AI are challenging to transfer across different contexts due to cultural and application-specific aspects. Different interaction patterns between humans and AI will be appropriate in different contexts, and definitions of trustworthiness vary between societies and applications. This raises questions about the sufficiency of existing evaluation frameworks and suggests the need for new approaches that can better adapt to contextual differences. Additionally, if an audited algorithm is reused and fails to meet requirements in a different context, assigning responsibility becomes complex. Even more difficult is the handling of AI solutions that consist of multiple interacting components, i.e., composite systems. Understanding how different components interact and affect each other is crucial when algorithms are reused in conjunction with other components. Even if single components are considered trustworthy, the results of their interplay potentially violate the requirements of trustworthy AI. Such uncertainties affect the licensing and use of software frameworks, which emphasizes the importance of developing licensing models that clearly outline accountability while promoting the responsible use of AI.</p></list-item>
<list-item><p><bold>Dynamics in evolving systems</bold>. One of the emerging issues in trustworthy AI is the potential of learning unintended facets during deployment. In evolving systems (i.e., systems that learn during deployment), in particular, the capturing of biases may lead to trustworthiness issues, especially with respect to fairness and non-discrimination. Such biases are often cognitive biases of users, which are acquired through ongoing learning cycles and require more sophisticated research to form a deeper understanding of related patterns and, furthermore, to develop approaches for detection and mitigation. This concern also highlights the necessity of dynamic and adaptive evaluation and simulation frameworks. Since the majority of trustworthy AI evaluation schemes operate in a static manner, additional research is needed to investigate, monitor, and capture long-term dynamics of trustworthiness.</p></list-item>
<list-item><p><bold>Investigating trustworthy AI in real-world contexts</bold>. Due to the complexity of AI systems and their contextual dependencies, it is crucial to study their functionality in real-life contexts to gain a deeper understanding of their impact. The involvement of human factors, such as how a system is used by different people and how this fits into a complex socio-technical context, makes real-world investigations very challenging from a methodological standpoint. However, for some requirements on AI systems, such as fairness or human agency, this may be particularly important to the extent that fully valid statements about these concepts may only be made after investigation in real-world contexts. Thus, monitoring the trustworthiness of AI is an ongoing investigation, especially after the system has been deployed in a real-world context.</p></list-item>
</list>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Overarching research challenges identified in this paper in relation to the AI-lifecycle phases.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fdata-07-1467222-g0004.tif"/>
</fig>
<p>Finally, and as outlined in Sections 3.1&#x02013;3.6, the current developments around generative AI and LLMs introduce new challenges for establishing and evaluating trustworthy AI. Therefore, future research also needs to investigate how existing trustworthy AI methods and definitions (e.g., fairness metrics for binary classification problems) can be transformed into more general settings provided by generative AI and LLMs. We hope that our paper provides a reference point for both researchers and practitioners in the field of trustworthy AI and a starting point for future research directions addressing the open research challenges identified in this work and discussed in this section.</p></sec>
</body>
<back>
<sec sec-type="author-contributions" id="s5">
<title>Author contributions</title>
<p>DK: Conceptualization, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. SS: Investigation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. VP-S: Investigation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. PM: Investigation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. KW: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. LD: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. AF: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. MT: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. IM: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. I&#x00160;: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. VS: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. AT: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. EV: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. RK: Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. TN: Investigation, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing. SK: Conceptualization, Supervision, Writing &#x02013; original draft, Writing &#x02013; review &#x00026; editing.</p>
</sec>
<sec sec-type="funding-information" id="s6">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. The work received funding from the TU Graz Open Access Publishing Fund.</p>
</sec>
<ack><p>Parts of this manuscript are based on white papers created by SGS Digital Trust Services GmbH and Know Center Research GmbH, which are available online via Zenodo: <ext-link ext-link-type="uri" xlink:href="https://zenodo.org/records/11207961">https://zenodo.org/records/11207961</ext-link>. Know Center Research GmbH is a COMET Center within the COMET&#x02014;Competence Centers for Excellent Technologies Program and funded by BMK, BMAW, as well as the co-financing provinces Styria, Vienna and Tyrol. COMET is managed by FFG.</p>
</ack>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of interest</title>
<p>DK, SS, VP-S, PM, KW, LD, AF, MT, IM, I&#x00160;, VS, AT, EV, RK, and SK were employed by Know Center Research GmbH. TN was employed by SGS Digital Trust Services GmbH.</p>
</sec>
<sec sec-type="disclaimer" id="s7">
<title>Publisher&#x00027;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link ext-link-type="uri" xlink:href="https://www.europarl.europa.eu/doceo/document/TA-9-2024-0138_EN.pdf">https://www.europarl.europa.eu/doceo/document/TA-9-2024-0138_EN.pdf</ext-link></p></fn>
<fn id="fn0002"><p><sup>2</sup><ext-link ext-link-type="uri" xlink:href="https://incidentdatabase.ai/cite/19/&#x00023;r184">https://incidentdatabase.ai/cite/19/&#x00023;r184</ext-link></p></fn>
<fn id="fn0003"><p><sup>3</sup><ext-link ext-link-type="uri" xlink:href="https://incidentdatabase.ai/cite/92/&#x00023;r2037">https://incidentdatabase.ai/cite/92/&#x00023;r2037</ext-link></p></fn>
<fn id="fn0004"><p><sup>4</sup><ext-link ext-link-type="uri" xlink:href="https://incidentdatabase.ai/cite/357">https://incidentdatabase.ai/cite/357</ext-link></p></fn>
<fn id="fn0005"><p><sup>5</sup><ext-link ext-link-type="uri" xlink:href="https://digital-strategy.ec.europa.eu/en/library/ethics-guidelines-trustworthy-ai">https://digital-strategy.ec.europa.eu/en/library/ethics-guidelines-trustworthy-ai</ext-link></p></fn>
<fn id="fn0006"><p><sup>6</sup>In this article, we only present individual approaches as examples without any claim to completeness.</p></fn>
<fn id="fn0007"><p><sup>7</sup><ext-link ext-link-type="uri" xlink:href="https://hcai-at-neurips.github.io/site/">https://hcai-at-neurips.github.io/site/</ext-link></p></fn>
<fn id="fn0008"><p><sup>8</sup><ext-link ext-link-type="uri" xlink:href="https://facctconference.org/">https://facctconference.org/</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Abadi</surname> <given-names>M.</given-names></name> <name><surname>Chu</surname> <given-names>A.</given-names></name> <name><surname>Goodfellow</surname> <given-names>I. J.</given-names></name> <name><surname>McMahan</surname> <given-names>H. B.</given-names></name> <name><surname>Mironov</surname> <given-names>I.</given-names></name> <name><surname>Talwar</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>&#x0201C;Deep learning with differential privacy,&#x0201D;</article-title> in <source>Proceedings of the 2016 ACM SIGSAC Conference on Computer and Communications Security</source>, eds. E. R. Weippl, S. Katzenbeisser, C. Kruegel, A. C. Myers, and S. Halevi (<publisher-loc>Vienna</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>308</fpage>&#x02013;<lpage>318</lpage>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Adadi</surname> <given-names>A.</given-names></name> <name><surname>Berrada</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>Peeking inside the black-box: a survey on explainable artificial intelligence (XAI)</article-title>. <source>IEEE Access</source> <volume>6</volume>, <fpage>52138</fpage>&#x02013;<lpage>52160</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2018.2870052</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Adebayo</surname> <given-names>J.</given-names></name> <name><surname>Gilmer</surname> <given-names>J.</given-names></name> <name><surname>Muelly</surname> <given-names>M.</given-names></name> <name><surname>Goodfellow</surname> <given-names>I.</given-names></name> <name><surname>Hardt</surname> <given-names>M.</given-names></name> <name><surname>Kim</surname> <given-names>B.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Sanity checks for saliency maps,&#x0201D;</article-title> in <source>Proceedings of the 32nd International Conference on Neural Information Processing Systems, NIPS&#x00027;18</source> (<publisher-loc>Red Hook, NY</publisher-loc>: <publisher-name>Curran Associates Inc.</publisher-name>), <fpage>9525</fpage>&#x02013;<lpage>9536</lpage>.</citation>
</ref>
<ref id="B4">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Adilova</surname> <given-names>L.</given-names></name> <name><surname>B&#x000F6;ttinger</surname> <given-names>K.</given-names></name> <name><surname>Danos</surname> <given-names>V.</given-names></name> <name><surname>Jakob</surname> <given-names>S.</given-names></name> <name><surname>Langer</surname> <given-names>F.</given-names></name> <name><surname>Markert</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2022</year>). <source>Security of AI-Systems: Fundamentals - Adversarial Deep Learning</source>. Available at: <ext-link ext-link-type="uri" xlink:href="https://www.bsi.bund.de/SharedDocs/Downloads/EN/BSI/KI/Security-of-AI-systems_fundamentals.html">https://www.bsi.bund.de/SharedDocs/Downloads/EN/BSI/KI/Security-of-AI-systems_fundamentals.html</ext-link> (accessed June, 2024).</citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Akbar</surname> <given-names>M. A.</given-names></name> <name><surname>Khan</surname> <given-names>A. A.</given-names></name> <name><surname>Mahmood</surname> <given-names>S.</given-names></name> <name><surname>Rafi</surname> <given-names>S.</given-names></name> <name><surname>Demi</surname> <given-names>S.</given-names></name></person-group> (<year>2024</year>). <article-title>Trustworthy artificial intelligence: a decision-making taxonomy of potential challenges</article-title>. <source>Softw. Pract. Exp</source>. <volume>54</volume>, <fpage>1621</fpage>&#x02013;<lpage>1650</lpage>. <pub-id pub-id-type="doi">10.1002/spe.3216</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Akula</surname> <given-names>R.</given-names></name> <name><surname>Garibay</surname> <given-names>I.</given-names></name></person-group> (<year>2021</year>). <article-title>Audit and assurance of ai algorithms: a framework to ensure ethical algorithmic practices in artificial intelligence</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2107.14046</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Ala-Pietil&#x000E4;</surname> <given-names>P.</given-names></name> <name><surname>Bonnet</surname> <given-names>Y.</given-names></name> <name><surname>Bergmann</surname> <given-names>U.</given-names></name> <name><surname>Bielikova</surname> <given-names>M.</given-names></name> <name><surname>Bonefeld-Dahl</surname> <given-names>C.</given-names></name> <name><surname>Bauer</surname> <given-names>W.</given-names></name> <etal/></person-group>. (<year>2020</year>). <source>The Assessment List for Trustworthy Artificial Intelligence (ALTAI)</source>. <publisher-loc>Lausanne</publisher-loc>: <publisher-name>European Commission</publisher-name>.</citation>
</ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Albahri</surname> <given-names>A. S.</given-names></name> <name><surname>Duhaim</surname> <given-names>A. M.</given-names></name> <name><surname>Fadhel</surname> <given-names>M. A.</given-names></name> <name><surname>Alnoor</surname> <given-names>A.</given-names></name> <name><surname>Baqer</surname> <given-names>N. S.</given-names></name> <name><surname>Alzubaidi</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>A systematic review of trustworthy and explainable artificial intelligence in healthcare: Assessment of quality, bias risk, and data fusion</article-title>. <source>Inf. Fus</source>. <volume>96</volume>, <fpage>156</fpage>&#x02013;<lpage>191</lpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2023.03.008</pub-id></citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Almanifi</surname> <given-names>O. R. A.</given-names></name> <name><surname>Chow</surname> <given-names>C.-O.</given-names></name> <name><surname>Tham</surname> <given-names>M.-L.</given-names></name> <name><surname>Chuah</surname> <given-names>J. H.</given-names></name> <name><surname>Kanesan</surname> <given-names>J.</given-names></name></person-group> (<year>2023</year>). <article-title>Communication and computation efficiency in federated learning: a survey</article-title>. <source>Int. Things</source> <volume>22</volume>:<fpage>100742</fpage>. <pub-id pub-id-type="doi">10.1016/j.iot.2023.100742</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alvarez-Melis</surname> <given-names>D.</given-names></name> <name><surname>Jaakkola</surname> <given-names>T. S.</given-names></name></person-group> (<year>2018a</year>). <article-title>On the robustness of interpretability methods</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1806.08049</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Alvarez-Melis</surname> <given-names>D.</given-names></name> <name><surname>Jaakkola</surname> <given-names>T. S.</given-names></name></person-group> (<year>2018b</year>). <article-title>&#x0201C;Towards robust interpretability with self-explaining neural networks,&#x0201D;</article-title> in <source>Proceedings of the 32nd International Conference on Neural Information Processing Systems (NeurIPS)</source> (<publisher-loc>Red Hook, NY</publisher-loc>: <publisher-name>Curran Associates Inc.</publisher-name>), <fpage>7786</fpage>&#x02013;<lpage>7795</lpage>.</citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anders</surname> <given-names>C. J.</given-names></name> <name><surname>Weber</surname> <given-names>L.</given-names></name> <name><surname>Neumann</surname> <given-names>D.</given-names></name> <name><surname>Samek</surname> <given-names>W.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>K.-R.</given-names></name> <name><surname>Lapuschkin</surname> <given-names>S.</given-names></name></person-group> (<year>2022</year>). <article-title>Finding and removing clever hans: using explanation methods to debug and improve deep models</article-title>. <source>Inf. Fus</source>. <volume>77</volume>, <fpage>261</fpage>&#x02013;<lpage>295</lpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2021.07.015</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Anderson</surname> <given-names>A.</given-names></name> <name><surname>Maystre</surname> <given-names>L.</given-names></name> <name><surname>Anderson</surname> <given-names>I.</given-names></name> <name><surname>Mehrotra</surname> <given-names>R.</given-names></name> <name><surname>Lalmas</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Algorithmic effects on the diversity of consumption on spotify,&#x0201D;</article-title> in <source>Proceedings of the Web Conference 2020</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>2155</fpage>&#x02013;<lpage>2165</lpage>.</citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anderson</surname> <given-names>M.</given-names></name> <name><surname>Fort</surname> <given-names>K.</given-names></name></person-group> (<year>2022</year>). <article-title>Human where? A new scale defining human involvement in technology communities from an ethical standpoint</article-title>. <source>Int. Rev. Inf. Ethics</source> <volume>31</volume>. <pub-id pub-id-type="doi">10.29173/irie477</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Arias-Duart</surname> <given-names>A.</given-names></name> <name><surname>Par&#x000E9;s</surname> <given-names>F.</given-names></name> <name><surname>Garcia-Gasulla</surname> <given-names>D.</given-names></name> <name><surname>Gimenez-Abalos</surname> <given-names>V.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Focus! rating xai methods and finding biases,&#x0201D;</article-title> in <source>2022 IEEE International Conference on Fuzzy Systems (FUZZ-IEEE)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>8</lpage>.</citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arrieta</surname> <given-names>A. B.</given-names></name> <name><surname>D&#x000ED;az-Rodr&#x000ED;guez</surname> <given-names>N.</given-names></name> <name><surname>Del Ser</surname> <given-names>J.</given-names></name> <name><surname>Bennetot</surname> <given-names>A.</given-names></name> <name><surname>Tabik</surname> <given-names>S.</given-names></name> <name><surname>Barbado</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Explainable artificial intelligence (XAI): concepts, taxonomies, opportunities and challenges toward responsible ai</article-title>. <source>Inf. Fus</source>. <volume>58</volume>, <fpage>82</fpage>&#x02013;<lpage>115</lpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2019.12.012</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Artelt</surname> <given-names>A.</given-names></name> <name><surname>Hammer</surname> <given-names>B.</given-names></name></person-group> (<year>2019</year>). <article-title>On the computation of counterfactual explanations - a survey</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1911.07749</pub-id><pub-id pub-id-type="pmid">39067152</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arya</surname> <given-names>V.</given-names></name> <name><surname>Bellamy</surname> <given-names>R. K.</given-names></name> <name><surname>Chen</surname> <given-names>P.-Y.</given-names></name> <name><surname>Dhurandhar</surname> <given-names>A.</given-names></name> <name><surname>Hind</surname> <given-names>M.</given-names></name> <name><surname>Hoffman</surname> <given-names>S. C.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>One explanation does not fit all: a toolkit and taxonomy of ai explainability techniques</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.1145/3351095.3375667</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bae</surname> <given-names>H.</given-names></name> <name><surname>Jang</surname> <given-names>J.</given-names></name> <name><surname>Jung</surname> <given-names>D.</given-names></name> <name><surname>Jang</surname> <given-names>H.</given-names></name> <name><surname>Ha</surname> <given-names>H.</given-names></name> <name><surname>Yoon</surname> <given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>Security and privacy issues in deep learning</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1807.11655</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baeza-Yates</surname> <given-names>R.</given-names></name></person-group> (<year>2018</year>). <article-title>Bias on the web</article-title>. <source>Commun. ACM</source> <volume>61</volume>, <fpage>54</fpage>&#x02013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1145/3209581</pub-id></citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bagdasaryan</surname> <given-names>E.</given-names></name> <name><surname>Poursaeed</surname> <given-names>O.</given-names></name> <name><surname>Shmatikov</surname> <given-names>V.</given-names></name></person-group> (<year>2019</year>). <article-title>Differential privacy has disparate impact on model accuracy</article-title>. <source>Adv. Neural Inf. Process. Syst</source>. <volume>32</volume>.</citation>
</ref>
<ref id="B22">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bagdasaryan</surname> <given-names>E.</given-names></name> <name><surname>Veit</surname> <given-names>A.</given-names></name> <name><surname>Hua</surname> <given-names>Y.</given-names></name> <name><surname>Estrin</surname> <given-names>D.</given-names></name> <name><surname>Shmatikov</surname> <given-names>V.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;How to backdoor federated learning,&#x0201D;</article-title> in <source>International Conference on Artificial Intelligence and Statistics</source> (<publisher-name>PMLR</publisher-name>), <fpage>2938</fpage>&#x02013;<lpage>2948</lpage>.</citation>
</ref>
<ref id="B23">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Barocas</surname> <given-names>S.</given-names></name> <name><surname>Hardt</surname> <given-names>M.</given-names></name> <name><surname>Narayanan</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <source>Fairness and Machine Learning: Limitations and Opportunities</source>. Available at: <ext-link ext-link-type="uri" xlink:href="https://fairmlbook.org/">https://fairmlbook.org/</ext-link> (accessed June 19, 2019).</citation>
</ref>
<ref id="B24">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Barocas</surname> <given-names>S.</given-names></name> <name><surname>Hardt</surname> <given-names>M.</given-names></name> <name><surname>Narayanan</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <source>Fairness and Machine Learning: Limitations and Opportunities</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>.</citation>
</ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barocas</surname> <given-names>S.</given-names></name> <name><surname>Selbst</surname> <given-names>A. D.</given-names></name></person-group> (<year>2016</year>). <article-title>Big data&#x00027;s disparate impact</article-title>. <source>Calif. L. Rev</source>. <volume>104</volume>:<fpage>671</fpage>. <pub-id pub-id-type="doi">10.2139/ssrn.2477899</pub-id></citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baxter</surname> <given-names>G.</given-names></name> <name><surname>Sommerville</surname> <given-names>I.</given-names></name></person-group> (<year>2010</year>). <article-title>Socio-technical systems: from design methods to systems engineering</article-title>. <source>Interact. Comput</source>. <volume>23</volume>, <fpage>4</fpage>&#x02013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1016/j.intcom.2010.07.003</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bellamy</surname> <given-names>R. K.</given-names></name> <name><surname>Dey</surname> <given-names>K.</given-names></name> <name><surname>Hind</surname> <given-names>M.</given-names></name> <name><surname>Hoffman</surname> <given-names>S. C.</given-names></name> <name><surname>Houde</surname> <given-names>S.</given-names></name> <name><surname>Kannan</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>AI fairness 360: an extensible toolkit for detecting and mitigating algorithmic bias</article-title>. <source>IBM J. Res. Dev</source>. <volume>63</volume>:<fpage>2942287</fpage>. <pub-id pub-id-type="doi">10.1147/JRD.2019.2942287</pub-id><pub-id pub-id-type="pmid">33813791</pub-id></citation></ref>
<ref id="B28">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bennett</surname> <given-names>D.</given-names></name> <name><surname>Metatla</surname> <given-names>O.</given-names></name> <name><surname>Roudaut</surname> <given-names>A.</given-names></name> <name><surname>Mekler</surname> <given-names>E. D.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;How does HCI understand human agency and autonomy?,&#x0201D;</article-title> in <source>Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>18</lpage>.</citation>
</ref>
<ref id="B29">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bhatt</surname> <given-names>U.</given-names></name> <name><surname>Weller</surname> <given-names>A.</given-names></name> <name><surname>Moura</surname> <given-names>J. M. F.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Evaluating and aggregating feature-based model explanations,&#x0201D;</article-title> in <source>Proceedings of the Twenty-Ninth International Joint Conference on Artificial Intelligence, IJCAI-20</source>, ed. C. Bessiere (International Joint Conferences on Artificial Intelligence Organization; Washington, DC: AAAI Press), <fpage>3016</fpage>&#x02013;<lpage>3022</lpage>.</citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Biecek</surname> <given-names>P.</given-names></name></person-group> (<year>2018</year>). <article-title>Dalex: explainers for complex predictive models in R</article-title>. <source>J. Mach. Learn. Res</source>. <volume>19</volume>, <fpage>1</fpage>&#x02013;<lpage>5</lpage>.</citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Binns</surname> <given-names>R.</given-names></name></person-group> (<year>2018</year>). <article-title>Algorithmic accountability and public reason</article-title>. <source>Philos. Technol</source>. <volume>31</volume>, <fpage>1</fpage>&#x02013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1007/s13347-017-0263-5</pub-id><pub-id pub-id-type="pmid">30873342</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bird</surname> <given-names>S.</given-names></name> <name><surname>Dud&#x000ED;k</surname> <given-names>M.</given-names></name> <name><surname>Edgar</surname> <given-names>R.</given-names></name> <name><surname>Horn</surname> <given-names>B.</given-names></name> <name><surname>Lutz</surname> <given-names>R.</given-names></name> <name><surname>Milan</surname> <given-names>V.</given-names></name> <etal/></person-group>. (<year>2020</year>). <source>Fairlearn: A Toolkit for Assessing and Improving Fairness in AI</source>. <publisher-loc>Technical Report MSR-TR-2020-32, Microsoft. Washington, DC</publisher-loc>: <publisher-name>ACM</publisher-name>.</citation>
</ref>
<ref id="B33">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bird</surname> <given-names>S.</given-names></name> <name><surname>Kenthapadi</surname> <given-names>K.</given-names></name> <name><surname>Kiciman</surname> <given-names>E.</given-names></name> <name><surname>Mitchell</surname> <given-names>M.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Fairness-aware machine learning: practical challenges and lessons learned,&#x0201D;</article-title> in <source>Proceedings of the Twelfth ACM International Conference on Web Search and Data Mining</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>834</fpage>&#x02013;<lpage>835</lpage>.</citation>
</ref>
<ref id="B34">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bivins</surname> <given-names>T. H.</given-names></name></person-group> (<year>2006</year>). <article-title>&#x0201C;Responsibility and accountability,&#x0201D;</article-title> in <source>Ethics in Public Relations: Responsible Advocacy</source>, eds. K. Fitzpatrick and C. Bronstein (<publisher-name>SAGE Publications, Inc.</publisher-name>), <fpage>19</fpage>&#x02013;<lpage>38</lpage>.</citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blanchard</surname> <given-names>G.</given-names></name> <name><surname>Lee</surname> <given-names>G.</given-names></name> <name><surname>Scott</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>Generalizing from several related classification tasks to a new unlabeled sample</article-title>. <source>Adv. Neural Inf. Process. Syst</source>. <volume>24</volume>. <pub-id pub-id-type="pmid">30807567</pub-id></citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bovens</surname> <given-names>M.</given-names></name></person-group> (<year>2007</year>). <article-title>Analysing and assessing accountability: a conceptual framework</article-title>. <source>Eur. L. J</source>. <volume>13</volume>, <fpage>447</fpage>&#x02013;<lpage>468</lpage>. <pub-id pub-id-type="doi">10.1111/j.1468-0386.2007.00378.x</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bovens</surname> <given-names>M.</given-names></name></person-group> (<year>2010</year>). <article-title>Two concepts of accountability: accountability as a virtue and as a mechanism</article-title>. <source>West Eur. Polit</source>. <volume>33</volume>, <fpage>946</fpage>&#x02013;<lpage>967</lpage>. <pub-id pub-id-type="doi">10.1080/01402382.2010.486119</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brandsma</surname> <given-names>G.</given-names></name> <name><surname>Schillemans</surname> <given-names>T.</given-names></name></person-group> (<year>2012</year>). <article-title>The accountability cube: measuring accountability</article-title>. <source>J. Public Administ. Res. Theory</source> <volume>23</volume>, <fpage>953</fpage>&#x02013;<lpage>975</lpage>. <pub-id pub-id-type="doi">10.1093/jopart/mus034</pub-id></citation>
</ref>
<ref id="B39">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Brown</surname> <given-names>A.</given-names></name> <name><surname>Chouldechova</surname> <given-names>A.</given-names></name> <name><surname>Putnam-Hornstein</surname> <given-names>E.</given-names></name> <name><surname>Tobin</surname> <given-names>A.</given-names></name> <name><surname>Vaithianathan</surname> <given-names>R.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Toward algorithmic accountability in public services: a qualitative study of affected community perspectives on algorithmic decision-making in child welfare services,&#x0201D;</article-title> in <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>12</lpage>.</citation>
</ref>
<ref id="B40">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Brown</surname> <given-names>H.</given-names></name> <name><surname>Lee</surname> <given-names>K.</given-names></name> <name><surname>Mireshghallah</surname> <given-names>F.</given-names></name> <name><surname>Shokri</surname> <given-names>R.</given-names></name> <name><surname>Tram&#x000E8;r</surname> <given-names>F.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;What does it mean for a language model to preserve privacy?,&#x0201D;</article-title> in <source>Proceedings of the 2022 ACM Conference on Fairness, Accountability, and Transparency</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>2280</fpage>&#x02013;<lpage>2292</lpage>.</citation>
</ref>
<ref id="B41">
<citation citation-type="web"><person-group person-group-type="author"><collab>BSI</collab></person-group> (<year>2022</year>). <source>AI Security Concerns in a Nutshell</source>. Available at: <ext-link ext-link-type="uri" xlink:href="https://www.bsi.bund.de/SharedDocs/Downloads/EN/BSI/KI/Practical_Al-Security_Guide_2023.html">https://www.bsi.bund.de/SharedDocs/Downloads/EN/BSI/KI/Practical_Al-Security_Guide_2023.html</ext-link> (accessed June, 2024).</citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buhmann</surname> <given-names>A.</given-names></name> <name><surname>Pa&#x000DF;mann</surname> <given-names>J.</given-names></name> <name><surname>Fieseler</surname> <given-names>C.</given-names></name></person-group> (<year>2019</year>). <article-title>Managing algorithmic accountability: Balancing reputational concerns, engagement strategies, and the potential of rational discourse</article-title>. <source>J. Bus. Ethics</source> <volume>163</volume>, <fpage>265</fpage>&#x02013;<lpage>280</lpage>. <pub-id pub-id-type="doi">10.1007/s10551-019-04226-4</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Buolamwini</surname> <given-names>J.</given-names></name> <name><surname>Gebru</surname> <given-names>T.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Gender shades: Intersectional accuracy disparities in commercial gender classification,&#x0201D;</article-title> in <source>Proceedings of the 1st Conference on Fairness, Accountability and Transparency, volume 81 of Proceedings of Machine Learning Research</source>, eds. S. A. Friedler, and C. Wilson (<publisher-name>PMLR</publisher-name>), <fpage>77</fpage>&#x02013;<lpage>91</lpage>.</citation>
</ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Busuioc</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Accountable artificial intelligence: Holding algorithms to account</article-title>. <source>Public Adm. Rev</source>. <volume>81</volume>:<fpage>13293</fpage>. <pub-id pub-id-type="doi">10.1111/puar.13293</pub-id><pub-id pub-id-type="pmid">34690372</pub-id></citation></ref>
<ref id="B45">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Calders</surname> <given-names>T.</given-names></name> <name><surname>Kamiran</surname> <given-names>F.</given-names></name> <name><surname>Pechenizkiy</surname> <given-names>M.</given-names></name></person-group> (<year>2009</year>). <article-title>&#x0201C;Building classifiers with independency constraints,&#x0201D;</article-title> in <source>2009 IEEE International Conference on Data Mining Workshops</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>13</fpage>&#x02013;<lpage>18</lpage>.</citation>
</ref>
<ref id="B46">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Calmon</surname> <given-names>F.</given-names></name> <name><surname>Wei</surname> <given-names>D.</given-names></name> <name><surname>Vinzamuri</surname> <given-names>B.</given-names></name> <name><surname>Natesan Ramamurthy</surname> <given-names>K.</given-names></name> <name><surname>Varshney</surname> <given-names>K. R.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Optimized pre-processing for discrimination prevention,&#x0201D;</article-title> in <source>NIPS&#x00027;17: Proceedings of the 31st International Conference on Neural Information Processing Systems</source> (<publisher-name>MIT Press</publisher-name>).</citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cao</surname> <given-names>L.</given-names></name></person-group> (<year>2022</year>). <article-title>Ai in finance: challenges, techniques, and opportunities</article-title>. <source>ACM Comp. Surv</source>. <volume>55</volume>, <fpage>1</fpage>&#x02013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1145/3502289</pub-id></citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carter</surname> <given-names>S.</given-names></name> <name><surname>Armstrong</surname> <given-names>Z.</given-names></name> <name><surname>Schubert</surname> <given-names>L.</given-names></name> <name><surname>Johnson</surname> <given-names>I.</given-names></name> <name><surname>Olah</surname> <given-names>C.</given-names></name></person-group> (<year>2019</year>). <article-title>Activation atlas</article-title>. <source>Distill</source> <volume>4</volume>:<fpage>e15</fpage>. <pub-id pub-id-type="doi">10.23915/distill.00015</pub-id></citation>
</ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carvalho</surname> <given-names>D. V.</given-names></name> <name><surname>Pereira</surname> <given-names>E. M.</given-names></name> <name><surname>Cardoso</surname> <given-names>J. S.</given-names></name></person-group> (<year>2019</year>). <article-title>Machine learning interpretability: a survey on methods and metrics</article-title>. <source>Electronics</source> <volume>8</volume>:<fpage>832</fpage>. <pub-id pub-id-type="doi">10.3390/electronics8080832</pub-id></citation>
</ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cech</surname> <given-names>F.</given-names></name></person-group> (<year>2021</year>). <article-title>The agency of the forum: mechanisms for algorithmic accountability through the lens of agency</article-title>. <source>J. Respons. Technol</source>. <volume>7&#x02013;8</volume>:<fpage>100015</fpage>. <pub-id pub-id-type="doi">10.1016/j.jrt.2021.100015</pub-id></citation>
</ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>H.-C. H.</given-names></name> <name><surname>Bui</surname> <given-names>M.</given-names></name> <name><surname>McIlwain</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>Targeted ads and/as racial discrimination: Exploring trends in new york city ads for college scholarships</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.24251/HICSS.2022.348</pub-id></citation>
</ref>
<ref id="B52">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Chatila</surname> <given-names>R.</given-names></name> <name><surname>Dignum</surname> <given-names>V.</given-names></name> <name><surname>Fisher</surname> <given-names>M.</given-names></name> <name><surname>Giannotti</surname> <given-names>F.</given-names></name> <name><surname>Morik</surname> <given-names>K.</given-names></name> <name><surname>Russell</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>&#x0201C;Trustworthy AI,&#x0201D;</article-title> in <source>Reflections on Artificial Intelligence for Humanity</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>13</fpage>&#x02013;<lpage>39</lpage>.<pub-id pub-id-type="pmid">38694954</pub-id></citation></ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Z.</given-names></name></person-group> (<year>2023</year>). <article-title>Ethics and discrimination in artificial intelligence-enabled recruitment practices</article-title>. <source>Human. Soc. Sci. Commun</source>. <volume>10</volume>, <fpage>1</fpage>&#x02013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1057/s41599-023-02079-x</pub-id></citation>
</ref>
<ref id="B54">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Costanza-Chock</surname> <given-names>S.</given-names></name> <name><surname>Raji</surname> <given-names>I. D.</given-names></name> <name><surname>Buolamwini</surname> <given-names>J.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Who audits the auditors? recommendations from a field scan of the algorithmic auditing ecosystem,&#x0201D;</article-title> in <source>Proceedings of the 2022 ACM Conference on Fairness, Accountability, and Transparency</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1571</fpage>&#x02013;<lpage>1583</lpage>.</citation>
</ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Debenedetti</surname> <given-names>E.</given-names></name> <name><surname>Severi</surname> <given-names>G.</given-names></name> <name><surname>Carlini</surname> <given-names>N.</given-names></name> <name><surname>Choquette-Choo</surname> <given-names>C. A.</given-names></name> <name><surname>Jagielski</surname> <given-names>M.</given-names></name> <name><surname>Nasr</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Privacy side channels in machine learning systems</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2309.05610</pub-id></citation>
</ref>
<ref id="B56">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Dennerlein</surname> <given-names>S.</given-names></name> <name><surname>Wolf-Brenner</surname> <given-names>C.</given-names></name> <name><surname>Gutounig</surname> <given-names>R.</given-names></name> <name><surname>Schweiger</surname> <given-names>S.</given-names></name> <name><surname>Pammer-Schindler</surname> <given-names>V.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Guiding socio-technical reflection of ethical principles in TEL software development: the SREP framework,&#x0201D;</article-title> in <source>Addressing Global Challenges and Quality Education</source>, eds. C. Alario-Hoyos, M. J. Rodr&#x000ED;guez-Triana, M. Scheffel, I. Arnedillo-S&#x000E1;nchez, and S. M. Dennerlein (Cham: Springer International Publishing), <fpage>386</fpage>&#x02013;<lpage>391</lpage>.</citation>
</ref>
<ref id="B57">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>D&#x000ED;az-Rodr&#x000ED;guez</surname> <given-names>N.</given-names></name> <name><surname>Del Ser</surname> <given-names>J.</given-names></name> <name><surname>Coeckelbergh</surname> <given-names>M.</given-names></name> <name><surname>de Prado</surname> <given-names>M. L.</given-names></name> <name><surname>Herrera-Viedma</surname> <given-names>E.</given-names></name> <name><surname>Herrera</surname> <given-names>F.</given-names></name></person-group> (<year>2023</year>). <article-title>Connecting the dots in trustworthy artificial intelligence: from AI principles, ethics, and key requirements to responsible AI systems and regulation</article-title>. <source>Inf. Fus</source>. <volume>99</volume>:<fpage>101896</fpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2023.101896</pub-id></citation>
</ref>
<ref id="B58">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doshi-Velez</surname> <given-names>F.</given-names></name> <name><surname>Kim</surname> <given-names>B.</given-names></name></person-group> (<year>2017</year>). <article-title>Towards a rigorous science of interpretable machine learning</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1702.08608</pub-id></citation>
</ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dubal</surname> <given-names>V.</given-names></name></person-group> (<year>2023</year>). <article-title>On algorithmic wage discrimination</article-title>. <source>Columbia Law Rev</source>. <volume>123</volume>, <fpage>1929</fpage>&#x02013;<lpage>1992</lpage>. <pub-id pub-id-type="doi">10.2139/ssrn.4331080</pub-id></citation>
</ref>
<ref id="B60">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Durante</surname> <given-names>M.</given-names></name> <name><surname>Floridi</surname> <given-names>L.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;A legal principles-based framework for AI liability regulation,&#x0201D;</article-title> in <source>The 2021 Yearbook of the Digital Ethics Lab</source>, eds. J. M&#x000F6;kander and M. Ziosi (New York, NY: Springer), <fpage>93</fpage>&#x02013;<lpage>112</lpage>.</citation>
</ref>
<ref id="B61">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Dutta</surname> <given-names>S.</given-names></name> <name><surname>Wei</surname> <given-names>D.</given-names></name> <name><surname>Yueksel</surname> <given-names>H.</given-names></name> <name><surname>Chen</surname> <given-names>P.-Y.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Varshney</surname> <given-names>K.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Is there a trade-off between fairness and accuracy? a perspective using mismatched hypothesis testing,&#x0201D;</article-title> in <source>International Conference on Machine Learning</source> (<publisher-name>PMLR</publisher-name>), <fpage>2803</fpage>&#x02013;<lpage>2813</lpage>.</citation>
</ref>
<ref id="B62">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Dwork</surname> <given-names>C.</given-names></name></person-group> (<year>2008</year>). <article-title>&#x0201C;Differential privacy: a survey of results,&#x0201D;</article-title> in <source>Theory and Applications of Models of Computation, 5th International Conference, TAMC 2008, Xi&#x00027;an, China, April 25-29, 2008. Proceedings, volume 4978 of Lecture Notes in Computer Science</source>, eds. M. Agrawal, D. Du, Z. Duan, and A. Li (Springer), <fpage>1</fpage>&#x02013;<lpage>19</lpage>.</citation>
</ref>
<ref id="B63">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dwork</surname> <given-names>C.</given-names></name> <name><surname>Roth</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>The algorithmic foundations of differential privacy</article-title>. <source>Found. Trends Theor. Comput. Sci</source>. <volume>9</volume>, <fpage>211</fpage>&#x02013;<lpage>407</lpage>. <pub-id pub-id-type="doi">10.1561/0400000042</pub-id></citation>
</ref>
<ref id="B64">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elliott</surname> <given-names>D.</given-names></name> <name><surname>Soifer</surname> <given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>AI technologies, privacy, and security</article-title>. <source>Front. Artif. Intell</source>. <volume>5</volume>:<fpage>826737</fpage>. <pub-id pub-id-type="doi">10.3389/frai.2022.826737</pub-id><pub-id pub-id-type="pmid">35493613</pub-id></citation></ref>
<ref id="B65">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emaminejad</surname> <given-names>N.</given-names></name> <name><surname>Akhavian</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>Trustworthy AI and robotics: implications for the AEC industry</article-title>. <source>Automat. Construct</source>. <volume>139</volume>:<fpage>104298</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2022.104298</pub-id></citation>
</ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eraut</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>Informal learning in the workplace</article-title>. <source>Stud. Contin. Educ</source>. <volume>26</volume>, <fpage>247</fpage>&#x02013;<lpage>273</lpage>. <pub-id pub-id-type="doi">10.1080/158037042000225245</pub-id></citation>
</ref>
<ref id="B67">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Eriks&#x000E9;n</surname> <given-names>S.</given-names></name></person-group> (<year>2002</year>). <article-title>&#x0201C;Designing for accountability,&#x0201D;</article-title> in <source>Proceedings of the Second Nordic Conference on Human-Computer Interaction</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>177</fpage>&#x02013;<lpage>186</lpage>.</citation>
</ref>
<ref id="B68">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Evans</surname> <given-names>D.</given-names></name> <name><surname>Kolesnikov</surname> <given-names>V.</given-names></name> <name><surname>Rosulek</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>A pragmatic introduction to secure multi-party computation</article-title>. <source>Found. Trends Priv. Secur</source>. <volume>2</volume>, <fpage>70</fpage>&#x02013;<lpage>246</lpage>. <pub-id pub-id-type="doi">10.1561/9781680835090</pub-id></citation>
</ref>
<ref id="B69">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Fancher</surname> <given-names>D.</given-names></name> <name><surname>Ammanath</surname> <given-names>B.</given-names></name> <name><surname>Holdowsky</surname> <given-names>J.</given-names></name> <name><surname>Buckley</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <source>Deloitte. Insights AI Model Bias Can Damage Trust More Than You May Know. But it Doesn&#x00027;t Have To</source> (<publisher-loc>London</publisher-loc>: <publisher-name>Deloitte Development LLC</publisher-name>).</citation>
</ref>
<ref id="B70">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Fanni</surname> <given-names>R.</given-names></name> <name><surname>Steinkogler</surname> <given-names>V. E.</given-names></name> <name><surname>Zampedri</surname> <given-names>G.</given-names></name> <name><surname>Pierson</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Active human agency in artificial intelligence mediation,&#x0201D;</article-title> in <source>Proceedings of the 6th EAI International Conference on Smart Objects and Technologies for Social Good</source> (<publisher-loc>Gent</publisher-loc>: <publisher-name>EAI</publisher-name>), <fpage>84</fpage>&#x02013;<lpage>89</lpage>.</citation>
</ref>
<ref id="B71">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Feldman</surname> <given-names>M.</given-names></name> <name><surname>Friedler</surname> <given-names>S. A.</given-names></name> <name><surname>Moeller</surname> <given-names>J.</given-names></name> <name><surname>Scheidegger</surname> <given-names>C.</given-names></name> <name><surname>Venkatasubramanian</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>&#x0201C;Certifying and removing disparate impact,&#x0201D;</article-title> in <source>Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>259</fpage>&#x02013;<lpage>268</lpage>.</citation>
</ref>
<ref id="B72">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fisher</surname> <given-names>R. A.</given-names></name></person-group> (<year>1922</year>). <article-title>On the mathematical foundations of theoretical statistics</article-title>. <source>Philos. Transact. R. Soc. London Ser. A</source> <volume>222</volume>, <fpage>309</fpage>&#x02013;<lpage>368</lpage>. <pub-id pub-id-type="doi">10.1098/rsta.1922.0009</pub-id></citation>
</ref>
<ref id="B73">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Floridi</surname> <given-names>L.</given-names></name></person-group> (<year>2021</year>). <article-title>Establishing the rules for building trustworthy AI</article-title>. <source>Ethics Govern. Policies Artif. Intell</source>. <fpage>41</fpage>&#x02013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-81907-1_4</pub-id></citation>
</ref>
<ref id="B74">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Fong</surname> <given-names>R. C.</given-names></name> <name><surname>Vedaldi</surname> <given-names>A.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Interpretable explanations of black boxes by meaningful perturbation,&#x0201D;</article-title> in <source>Proceedings of the IEEE International Conference on Computer Vision</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>3429</fpage>&#x02013;<lpage>3437</lpage>.<pub-id pub-id-type="pmid">38257608</pub-id></citation></ref>
<ref id="B75">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Friedler</surname> <given-names>S. A.</given-names></name> <name><surname>Scheidegger</surname> <given-names>C.</given-names></name> <name><surname>Venkatasubramanian</surname> <given-names>S.</given-names></name> <name><surname>Choudhary</surname> <given-names>S.</given-names></name> <name><surname>Hamilton</surname> <given-names>E. P.</given-names></name> <name><surname>Roth</surname> <given-names>D.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;A comparative study of fairness-enhancing interventions in machine learning,&#x0201D;</article-title> in <source>Proceedings of the Conference on Fairness, Accountability, and Transparency</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>329</fpage>&#x02013;<lpage>338</lpage>.</citation>
</ref>
<ref id="B76">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Friedman</surname> <given-names>A.</given-names></name> <name><surname>Berkovsky</surname> <given-names>S.</given-names></name> <name><surname>Kaafar</surname> <given-names>M. A.</given-names></name></person-group> (<year>2016</year>). <article-title>A differential privacy framework for matrix factorization recommender systems</article-title>. <source>User Model. User Adapt. Interact</source>. <volume>26</volume>, <fpage>425</fpage>&#x02013;<lpage>458</lpage>. <pub-id pub-id-type="doi">10.1007/s11257-016-9177-7</pub-id><pub-id pub-id-type="pmid">33739861</pub-id></citation></ref>
<ref id="B77">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gabriel</surname> <given-names>A.</given-names></name> <name><surname>Le&#x000F3;n</surname> <given-names>E. K. C.</given-names></name> <name><surname>Wilkins</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Accountability increases resource sharing: effects of accountability on human and AI system performance</article-title>. <source>Int. J. Human. Comp. Interact</source>. <volume>37</volume>, <fpage>434</fpage>&#x02013;<lpage>444</lpage>. <pub-id pub-id-type="doi">10.1080/10447318.2020.1824695</pub-id></citation>
</ref>
<ref id="B78">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>A.</given-names></name> <name><surname>Ju</surname> <given-names>C.</given-names></name> <name><surname>Yu</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>Q.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Privacy-preserving heterogeneous federated transfer learning,&#x0201D;</article-title> in <source>2019 IEEE International Conference on Big Data (Big Data)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>2552</fpage>&#x02013;<lpage>2559</lpage>.</citation>
</ref>
<ref id="B79">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garcia</surname> <given-names>L. P. F.</given-names></name> <name><surname>de Carvalho</surname> <given-names>A. C. P. L. F.</given-names></name> <name><surname>Lorena</surname> <given-names>A. C.</given-names></name></person-group> (<year>2015</year>). <article-title>Effect of label noise in the complexity of classification problems</article-title>. <source>Neurocomputing</source> <volume>160</volume>, <fpage>108</fpage>&#x02013;<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2014.10.085</pub-id></citation>
</ref>
<ref id="B80">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Gentry</surname> <given-names>C.</given-names></name></person-group> (<year>2009</year>). <source>A Fully Homomorphic Encryption Scheme</source>. <publisher-loc>Stanford, CA</publisher-loc>: <publisher-name>Stanford University</publisher-name>.</citation>
</ref>
<ref id="B81">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guidotti</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>Counterfactual explanations and how to find them: literature review and benchmarking</article-title>. <source>Data Mining Knowl. Disc</source>. <volume>38</volume>, <fpage>1</fpage>&#x02013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1007/s10618-022-00831-6</pub-id></citation>
</ref>
<ref id="B82">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gulrajani</surname> <given-names>I.</given-names></name> <name><surname>Lopez-Paz</surname> <given-names>D.</given-names></name></person-group> (<year>2020</year>). <article-title>In search of lost domain generalization</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2007.01434</pub-id></citation>
</ref>
<ref id="B83">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haakman</surname> <given-names>M.</given-names></name> <name><surname>Cruz</surname> <given-names>L.</given-names></name> <name><surname>Huijgens</surname> <given-names>H.</given-names></name> <name><surname>van Deursen</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>AI lifecycle models need to be revised: an exploratory study in fintech</article-title>. <source>Empir. Softw. Eng</source>. <volume>26</volume>, <fpage>1</fpage>&#x02013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1007/s10664-021-09993-1</pub-id></citation>
</ref>
<ref id="B84">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Hamon</surname> <given-names>R.</given-names></name> <name><surname>Junklewitz</surname> <given-names>H.</given-names></name> <name><surname>Sanchez</surname> <given-names>I.</given-names></name></person-group> (<year>2020</year>). <source>Robustness and Explainability of Artificial Intelligence</source>. <publisher-loc>Luxembourg</publisher-loc>: <publisher-name>Publications Office of the European Union</publisher-name> <volume>207</volume>:<fpage>2020</fpage>.</citation>
</ref>
<ref id="B85">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>S.</given-names></name> <name><surname>Lin</surname> <given-names>C.</given-names></name> <name><surname>Shen</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>Q.</given-names></name> <name><surname>Guan</surname> <given-names>X.</given-names></name></person-group> (<year>2023</year>). <article-title>Interpreting adversarial examples in deep learning: a review</article-title>. <source>ACM Comp. Surv</source>. <volume>55</volume>, <fpage>1</fpage>&#x02013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1145/3594869</pub-id></citation>
</ref>
<ref id="B86">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hauer</surname> <given-names>M.</given-names></name> <name><surname>Krafft</surname> <given-names>T.</given-names></name> <name><surname>Zweig</surname> <given-names>K.</given-names></name></person-group> (<year>2023</year>). <article-title>Overview of transparency and inspectability mechanisms to achieve accountability of artificial intelligence systems</article-title>. <source>Data Policy</source> <volume>5</volume>:<fpage>30</fpage>. <pub-id pub-id-type="doi">10.1017/dap.2023.30</pub-id></citation>
</ref>
<ref id="B87">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hedstr&#x000F6;m</surname> <given-names>A.</given-names></name> <name><surname>Weber</surname> <given-names>L.</given-names></name> <name><surname>Krakowczyk</surname> <given-names>D.</given-names></name> <name><surname>Bareeva</surname> <given-names>D.</given-names></name> <name><surname>Motzkus</surname> <given-names>F.</given-names></name> <name><surname>Samek</surname> <given-names>W.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Quantus: an explainable AI toolkit for responsible evaluation of neural network explanations and beyond</article-title>. <source>J. Mach. Learn. Res</source>. <volume>24</volume>, <fpage>1</fpage>&#x02013;<lpage>11</lpage>.</citation>
</ref>
<ref id="B88">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hendrycks</surname> <given-names>D.</given-names></name> <name><surname>Dietterich</surname> <given-names>T.</given-names></name></person-group> (<year>2019</year>). <article-title>Benchmarking neural network robustness to common corruptions and perturbations</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1903.12261</pub-id><pub-id pub-id-type="pmid">34388516</pub-id></citation></ref>
<ref id="B89">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hermann</surname> <given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>Artificial intelligence and mass personalization of communication content&#x02014;an ethical and literacy perspective</article-title>. <source>New Media Soc</source>. <volume>24</volume>, <fpage>1258</fpage>&#x02013;<lpage>1277</lpage>. <pub-id pub-id-type="doi">10.1177/14614448211022702</pub-id></citation>
</ref>
<ref id="B90">
<citation citation-type="book"><person-group person-group-type="author"><collab>High-Level Expert Group on AI</collab></person-group> (<year>2019</year>). <source>Ethics Guidelines for Trustworthy AI</source>. <publisher-loc>Brussels</publisher-loc>: <publisher-name>Report, European Commission</publisher-name>.</citation>
</ref>
<ref id="B91">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Holzinger</surname> <given-names>A.</given-names></name> <name><surname>Saranti</surname> <given-names>A.</given-names></name> <name><surname>Molnar</surname> <given-names>C.</given-names></name> <name><surname>Biecek</surname> <given-names>P.</given-names></name> <name><surname>Samek</surname> <given-names>W.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Explainable AI methods-a brief overview,&#x0201D;</article-title> in <source>International Workshop on Extending Explainable AI Beyond Deep Models and Classifiers</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>13</fpage>&#x02013;<lpage>38</lpage>.</citation>
</ref>
<ref id="B92">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Houwer</surname> <given-names>J. D.</given-names></name></person-group> (<year>2019</year>). <article-title>Implicit bias is behavior: a functional-cognitive perspective on implicit bias</article-title>. <source>Perspect. Psychol. Sci</source>. <volume>14</volume>, <fpage>835</fpage>&#x02013;<lpage>840</lpage>. <pub-id pub-id-type="doi">10.1177/1745691619855638</pub-id><pub-id pub-id-type="pmid">31374177</pub-id></citation></ref>
<ref id="B93">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Huber</surname> <given-names>P. J.</given-names></name></person-group> (<year>2004</year>). <source>Robust Statistics, Vol. 523</source>. <publisher-name>John Wiley &#x00026; Sons</publisher-name>.</citation>
</ref>
<ref id="B94">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hulsen</surname> <given-names>T.</given-names></name></person-group> (<year>2023</year>). <article-title>Explainable artificial intelligence (XAI): concepts and challenges in healthcare</article-title>. <source>AI</source> <volume>4</volume>, <fpage>652</fpage>&#x02013;<lpage>666</lpage>. <pub-id pub-id-type="doi">10.3390/ai4030034</pub-id></citation>
</ref>
<ref id="B95">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>John-Mathews</surname> <given-names>J.-M.</given-names></name></person-group> (<year>2022</year>). <article-title>Some critical and ethical perspectives on the empirical turn of AI interpretability</article-title>. <source>Technol. Forecast. Soc. Change</source> <volume>174</volume>:<fpage>121209</fpage>. <pub-id pub-id-type="doi">10.1016/j.techfore.2021.121209</pub-id></citation>
</ref>
<ref id="B96">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kahn</surname> <given-names>K.</given-names></name> <name><surname>Winters</surname> <given-names>N.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Child-friendly programming interfaces to AI cloud services,&#x0201D;</article-title> in <source>12th European Conference on Technology Enhanced Learning</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>566</fpage>&#x02013;<lpage>570</lpage>.</citation>
</ref>
<ref id="B97">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kaur</surname> <given-names>D.</given-names></name> <name><surname>Uslu</surname> <given-names>S.</given-names></name> <name><surname>Durresi</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>&#x0201C;Requirements for trustworthy artificial intelligence-a review,&#x0201D;</article-title> in <source>Advances in Networked-Based Information Systems: The 23rd International Conference on Network-Based Information Systems (NBiS-2020) 23</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>105</fpage>&#x02013;<lpage>115</lpage>.</citation>
</ref>
<ref id="B98">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaur</surname> <given-names>D.</given-names></name> <name><surname>Uslu</surname> <given-names>S.</given-names></name> <name><surname>Rittichier</surname> <given-names>K. J.</given-names></name> <name><surname>Durresi</surname> <given-names>A.</given-names></name></person-group> (<year>2022</year>). <article-title>Trustworthy artificial intelligence: a review</article-title>. <source>ACM Comp. Surv</source>. <volume>55</volume>, <fpage>1</fpage>&#x02013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1145/3491209</pub-id></citation>
</ref>
<ref id="B99">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>J.</given-names></name> <name><surname>Scott</surname> <given-names>C. D.</given-names></name></person-group> (<year>2012</year>). <article-title>Robust kernel density estimation</article-title>. <source>J. Mach. Learn. Res</source>. <volume>13</volume>, <fpage>2529</fpage>&#x02013;<lpage>2565</lpage>.</citation>
</ref>
<ref id="B100">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kindermans</surname> <given-names>P.-J.</given-names></name> <name><surname>Hooker</surname> <given-names>S.</given-names></name> <name><surname>Adebayo</surname> <given-names>J.</given-names></name> <name><surname>Alber</surname> <given-names>M.</given-names></name> <name><surname>Sch&#x000FC;tt</surname> <given-names>K. T.</given-names></name> <name><surname>D&#x000E4;hne</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>&#x0201C;The (Un)reliability of saliency methods,&#x0201D;</article-title> in <source>Explainable AI: Interpreting, Explaining and Visualizing Deep Learning</source>, eds. W. Samek, G. Montavon, A. Vedaldi, L. K. Hansen, and K. R. M&#x000FC;ller (Cham: Springer International Publishing), <fpage>267</fpage>&#x02013;<lpage>280</lpage>.</citation>
</ref>
<ref id="B101">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kohli</surname> <given-names>P.</given-names></name> <name><surname>Chadha</surname> <given-names>A.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Enabling pedestrian safety using computer vision techniques: a case study of the 2018 Uber Inc. self-driving car crash,&#x0201D;</article-title> in <source>Advances in Information and Communication: Proceedings of the 2019 Future of Information and Communication Conference (FICC), Volume 1</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>261</fpage>&#x02013;<lpage>279</lpage>.</citation>
</ref>
<ref id="B102">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kokhlikyan</surname> <given-names>N.</given-names></name> <name><surname>Miglani</surname> <given-names>V.</given-names></name> <name><surname>Martin</surname> <given-names>M.</given-names></name> <name><surname>Wang</surname> <given-names>E.</given-names></name> <name><surname>Alsallakh</surname> <given-names>B.</given-names></name> <name><surname>Reynolds</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Captum: a unified and generic model interpretability library for PyTorch</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2009.07896</pub-id></citation>
</ref>
<ref id="B103">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koshiyama</surname> <given-names>A.</given-names></name> <name><surname>Kazim</surname> <given-names>E.</given-names></name> <name><surname>Treleaven</surname> <given-names>P.</given-names></name> <name><surname>Rai</surname> <given-names>P.</given-names></name> <name><surname>Szpruch</surname> <given-names>L.</given-names></name> <name><surname>Pavey</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Towards algorithm auditing: a survey on managing legal, ethical and technological risks of AI, ML and associated algorithms</article-title>. <source>SSRN Electron. J</source>. <pub-id pub-id-type="doi">10.2139/ssrn.3778998</pub-id><pub-id pub-id-type="pmid">39076787</pub-id></citation></ref>
<ref id="B104">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kowald</surname> <given-names>D.</given-names></name> <name><surname>Lacic</surname> <given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Popularity bias in collaborative filtering-based multimedia recommender systems,&#x0201D;</article-title> in <source>International Workshop on Algorithmic Bias in Search and Recommendation</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>11</lpage>.</citation>
</ref>
<ref id="B105">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Kowald</surname> <given-names>D.</given-names></name> <name><surname>Schedl</surname> <given-names>M.</given-names></name> <name><surname>Lex</surname> <given-names>E.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;The unfairness of popularity bias in music recommendation: a reproducibility study,&#x0201D;</article-title> in <source>Advances in Information Retrieval: 42nd European Conference on IR Research, ECIR 2020, Lisbon, Portugal, April 14-17, 2020, Proceedings, Part II 42</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>35</fpage>&#x02013;<lpage>42</lpage>.</citation>
</ref>
<ref id="B106">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krizhevsky</surname> <given-names>A.</given-names></name> <name><surname>Sutskever</surname> <given-names>I.</given-names></name> <name><surname>Hinton</surname> <given-names>G. E.</given-names></name></person-group> (<year>2012</year>). <article-title>Imagenet classification with deep convolutional neural networks</article-title>. <source>Adv. Neural Inf. Process. Syst</source>. <volume>25</volume>. <pub-id pub-id-type="doi">10.1145/3065386</pub-id></citation>
</ref>
<ref id="B107">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lazer</surname> <given-names>D.</given-names></name> <name><surname>Kennedy</surname> <given-names>R.</given-names></name> <name><surname>King</surname> <given-names>G.</given-names></name> <name><surname>Vespignani</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>The parable of google flu: traps in big data analysis</article-title>. <source>Science</source> <volume>343</volume>, <fpage>1203</fpage>&#x02013;<lpage>1205</lpage>. <pub-id pub-id-type="doi">10.1126/science.1248506</pub-id><pub-id pub-id-type="pmid">24626916</pub-id></citation></ref>
<ref id="B108">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>LeCun</surname> <given-names>Y.</given-names></name> <name><surname>Bengio</surname> <given-names>Y.</given-names></name> <name><surname>Hinton</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Deep learning</article-title>. <source>Nature</source> <volume>521</volume>, <fpage>436</fpage>&#x02013;<lpage>444</lpage>. <pub-id pub-id-type="doi">10.1038/nature14539</pub-id><pub-id pub-id-type="pmid">26017442</pub-id></citation></ref>
<ref id="B109">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lepri</surname> <given-names>B.</given-names></name> <name><surname>Oliver</surname> <given-names>N.</given-names></name> <name><surname>Letouz&#x000E9;</surname> <given-names>E.</given-names></name> <name><surname>Pentland</surname> <given-names>A.</given-names></name> <name><surname>Vinck</surname> <given-names>P.</given-names></name></person-group> (<year>2018</year>). <article-title>Fair, transparent, and accountable algorithmic decision-making processes: The premise, the proposed solutions, and the open challenges</article-title>. <source>Philos. Technol</source>. <volume>31</volume>, <fpage>611</fpage>&#x02013;<lpage>627</lpage>. <pub-id pub-id-type="doi">10.1007/s13347-017-0279-x</pub-id></citation>
</ref>
<ref id="B110">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lewis</surname> <given-names>D.</given-names></name> <name><surname>Hogan</surname> <given-names>L.</given-names></name> <name><surname>Filip</surname> <given-names>D.</given-names></name> <name><surname>Wall</surname> <given-names>P. J.</given-names></name></person-group> (<year>2020</year>). <article-title>Global challenges in the standardization of ethics for trustworthy AI</article-title>. <source>J. ICT Standard</source>. <volume>8</volume>, <fpage>123</fpage>&#x02013;<lpage>150</lpage>. <pub-id pub-id-type="doi">10.13052/jicts2245-800X.823</pub-id><pub-id pub-id-type="pmid">31315747</pub-id></citation></ref>
<ref id="B111">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>B.</given-names></name> <name><surname>Qi</surname> <given-names>P.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Di</surname> <given-names>S.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Pei</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Trustworthy AI: from principles to practices</article-title>. <source>ACM Comp. Surv</source>. <volume>55</volume>, <fpage>1</fpage>&#x02013;<lpage>46</lpage>. <pub-id pub-id-type="doi">10.1145/3555803</pub-id></citation>
</ref>
<ref id="B112">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>T.</given-names></name> <name><surname>Sahu</surname> <given-names>A. K.</given-names></name> <name><surname>Talwalkar</surname> <given-names>A.</given-names></name> <name><surname>Smith</surname> <given-names>V.</given-names></name></person-group> (<year>2020</year>). <article-title>Federated learning: challenges, methods, and future directions</article-title>. <source>IEEE Signal Process. Mag</source>. <volume>37</volume>, <fpage>50</fpage>&#x02013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1109/MSP.2020.2975749</pub-id></citation>
</ref>
<ref id="B113">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>W.</given-names></name> <name><surname>Tadesse</surname> <given-names>G. A.</given-names></name> <name><surname>Ho</surname> <given-names>D.</given-names></name> <name><surname>Fei-Fei</surname> <given-names>L.</given-names></name> <name><surname>Zaharia</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2022</year>). <article-title>Advances, challenges and opportunities in creating data for trustworthy AI</article-title>. <source>Nat. Mach. Intell</source>. <volume>4</volume>, <fpage>669</fpage>&#x02013;<lpage>677</lpage>. <pub-id pub-id-type="doi">10.1038/s42256-022-00516-1</pub-id><pub-id pub-id-type="pmid">39332994</pub-id></citation></ref>
<ref id="B114">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Liao</surname> <given-names>Q. V.</given-names></name> <name><surname>Gruen</surname> <given-names>D.</given-names></name> <name><surname>Miller</surname> <given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;Questioning the ai: informing design practices for explainable ai user experiences,&#x0201D;</article-title> in <source>Proceedings of the 2020 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>15</lpage>.</citation>
</ref>
<ref id="B115">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>F.</given-names></name> <name><surname>Cheng</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>H.</given-names></name> <name><surname>Wei</surname> <given-names>Y.</given-names></name> <name><surname>Nie</surname> <given-names>L.</given-names></name> <name><surname>Kankanhalli</surname> <given-names>M.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Privacy-preserving synthetic data generation for recommendation systems,&#x0201D;</article-title> in <source>Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1379</fpage>&#x02013;<lpage>1389</lpage>.</citation>
</ref>
<ref id="B116">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Long</surname> <given-names>D.</given-names></name> <name><surname>Magerko</surname> <given-names>B.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;What is ai literacy? competencies and design considerations,&#x0201D;</article-title> in <source>Proceedings of the 2020 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>16</lpage>.</citation>
</ref>
<ref id="B117">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lundberg</surname> <given-names>S. M.</given-names></name> <name><surname>Lee</surname> <given-names>S.-I.</given-names></name></person-group> (<year>2017</year>). <article-title>A unified approach to interpreting model predictions</article-title>. <source>Adv. Neural Inf. Process. Syst</source>. <volume>30</volume>, <fpage>4765</fpage>&#x02013;<lpage>4774</lpage>.</citation>
</ref>
<ref id="B118">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Madiega</surname> <given-names>T.</given-names></name></person-group> (<year>2021</year>). <source>Artificial intelligence Act</source>. <publisher-loc>Brussels</publisher-loc>: <publisher-name>European Parliament: European Parliamentary Research Service</publisher-name>.</citation>
</ref>
<ref id="B119">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McDermid</surname> <given-names>J. A.</given-names></name> <name><surname>Jia</surname> <given-names>Y.</given-names></name> <name><surname>Porter</surname> <given-names>Z.</given-names></name> <name><surname>Habli</surname> <given-names>I.</given-names></name></person-group> (<year>2021</year>). <article-title>Artificial intelligence explainability: the technical and ethical dimensions</article-title>. <source>Philos. Transact. R. Soc. A</source> <volume>379</volume>:<fpage>20200363</fpage>. <pub-id pub-id-type="doi">10.1098/rsta.2020.0363</pub-id><pub-id pub-id-type="pmid">34398656</pub-id></citation></ref>
<ref id="B120">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McGregor</surname> <given-names>L.</given-names></name> <name><surname>Murray</surname> <given-names>D.</given-names></name> <name><surname>Ng</surname> <given-names>V.</given-names></name></person-group> (<year>2019</year>). <article-title>International human rights law as a framework for algorithmic accountability</article-title>. <source>Int. Comp. Law Q</source>. <volume>68</volume>, <fpage>309</fpage>&#x02013;<lpage>343</lpage>. <pub-id pub-id-type="doi">10.1017/S0020589319000046</pub-id></citation>
</ref>
<ref id="B121">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mehdiyev</surname> <given-names>N.</given-names></name> <name><surname>Fettke</surname> <given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>Explainable artificial intelligence for process mining: a general overview and application of a novel local explanation approach for predictive process monitoring</article-title>. <source>Interpret. Artif. Intell</source>. <volume>937</volume>, <fpage>1</fpage>&#x02013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-64949-4_1</pub-id></citation>
</ref>
<ref id="B122">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Mendoza</surname> <given-names>I. G.</given-names></name> <name><surname>Sabol</surname> <given-names>V.</given-names></name> <name><surname>Hoffer</surname> <given-names>J. G.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;On the importance of user role-tailored explanations in industry 5.0,&#x0201D;</article-title> in <source>VISIGRAPP (2: HUCAPP)</source> (<publisher-loc>Set&#x000FA;bal</publisher-loc>: <publisher-name>SciTePress</publisher-name>), <fpage>243</fpage>&#x02013;<lpage>250</lpage>.</citation>
</ref>
<ref id="B123">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miller</surname> <given-names>T.</given-names></name> <name><surname>Howe</surname> <given-names>P.</given-names></name> <name><surname>Sonenberg</surname> <given-names>L.</given-names></name></person-group> (<year>2017</year>). <article-title>Explainable AI: beware of inmates running the asylum or: How i learnt to stop worrying and love the social and behavioural sciences</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1712.00547</pub-id></citation>
</ref>
<ref id="B124">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Molnar</surname> <given-names>C.</given-names></name></person-group> (<year>2020</year>). <source>Interpretable Machine Learning</source>. <publisher-name>Lulu Press</publisher-name>.</citation>
</ref>
<ref id="B125">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Montavon</surname> <given-names>G.</given-names></name> <name><surname>Samek</surname> <given-names>W.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>K.-R.</given-names></name></person-group> (<year>2018</year>). <article-title>Methods for interpreting and understanding deep neural networks</article-title>. <source>Digit. Signal Process</source>. <volume>73</volume>, <fpage>1</fpage>&#x02013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1016/j.dsp.2017.10.011</pub-id></citation>
</ref>
<ref id="B126">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Moore</surname> <given-names>C.</given-names></name> <name><surname>O&#x00027;Neill</surname> <given-names>M.</given-names></name> <name><surname>O&#x00027;Sullivan</surname> <given-names>E.</given-names></name> <name><surname>Dor&#x000F6;z</surname> <given-names>Y.</given-names></name> <name><surname>Sunar</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>&#x0201C;Practical homomorphic encryption: a survey,&#x0201D;</article-title> in <source>2014 IEEE International Symposium on Circuits and Systems (ISCAS)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>2792</fpage>&#x02013;<lpage>2795</lpage>.</citation>
</ref>
<ref id="B127">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moreira</surname> <given-names>C.</given-names></name> <name><surname>Chou</surname> <given-names>Y.-L.</given-names></name> <name><surname>Hsieh</surname> <given-names>C.</given-names></name> <name><surname>Ouyang</surname> <given-names>C.</given-names></name> <name><surname>Jorge</surname> <given-names>J.</given-names></name> <name><surname>Pereira</surname> <given-names>J. M.</given-names></name></person-group> (<year>2022</year>). <article-title>Benchmarking counterfactual algorithms for XAI: from white box to black box</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2203.02399</pub-id></citation>
</ref>
<ref id="B128">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mosqueira-Rey</surname> <given-names>E.</given-names></name> <name><surname>Hern&#x000E1;ndez-Pereira</surname> <given-names>E.</given-names></name> <name><surname>Alonso-R&#x000ED;os</surname> <given-names>D.</given-names></name> <name><surname>Bobes-Bascar&#x000E1;n</surname> <given-names>J.</given-names></name> <name><surname>Fern&#x000E1;ndez-Leal</surname> <given-names>&#x000C1;.</given-names></name></person-group> (<year>2023</year>). <article-title>Human-in-the-loop machine learning: a state of the art</article-title>. <source>Artif. Intell. Rev</source>. <volume>56</volume>, <fpage>3005</fpage>&#x02013;<lpage>3054</lpage>. <pub-id pub-id-type="doi">10.1007/s10462-022-10246-w</pub-id></citation>
</ref>
<ref id="B129">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Muandet</surname> <given-names>K.</given-names></name> <name><surname>Balduzzi</surname> <given-names>D.</given-names></name> <name><surname>Sch&#x000F6;lkopf</surname> <given-names>B.</given-names></name></person-group> (<year>2013</year>). <article-title>&#x0201C;Domain generalization via invariant feature representation,&#x0201D;</article-title> in <source>Proceedings of the 30th International Conference on Machine Learning</source> - <italic>Volume 28, ICML&#x00027;13</italic> (<ext-link ext-link-type="uri" xlink:href="https://www.JMLR.org">JMLR.org</ext-link>), <fpage>10</fpage>&#x02013;<lpage>18</lpage>.</citation>
</ref>
<ref id="B130">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Muellner</surname> <given-names>P.</given-names></name> <name><surname>Kowald</surname> <given-names>D.</given-names></name> <name><surname>Lex</surname> <given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>&#x0201C;Robustness of meta matrix factorization against strict privacy constraints,&#x0201D;</article-title> in <source>Advances in Information Retrieval: 43rd European Conference on IR Research, ECIR 2021, Virtual Event, March 28-April 1, 2021, Proceedings, Part II 43</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>107</fpage>&#x02013;<lpage>119</lpage>.</citation>
</ref>
<ref id="B131">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>M&#x000FC;llner</surname> <given-names>P.</given-names></name> <name><surname>Lex</surname> <given-names>E.</given-names></name> <name><surname>Schedl</surname> <given-names>M.</given-names></name> <name><surname>Kowald</surname> <given-names>D.</given-names></name></person-group> (<year>2023</year>). <article-title>Differential privacy in collaborative filtering recommender systems: a review</article-title>. <source>Fron. Big Data</source> <volume>6</volume>:<fpage>1249997</fpage>. <pub-id pub-id-type="doi">10.3389/fdata.2023.1249997</pub-id><pub-id pub-id-type="pmid">37901117</pub-id></citation></ref>
<ref id="B132">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>M&#x000FC;llner</surname> <given-names>P.</given-names></name> <name><surname>Lex</surname> <given-names>E.</given-names></name> <name><surname>Schedl</surname> <given-names>M.</given-names></name> <name><surname>Kowald</surname> <given-names>D.</given-names></name></person-group> (<year>2024</year>). <article-title>&#x0201C;The impact of differential privacy on recommendation accuracy and popularity bias,&#x0201D;</article-title> in <source>European Conference on Information Retrieval</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>466</fpage>&#x02013;<lpage>482</lpage>.</citation>
</ref>
<ref id="B133">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Munro</surname> <given-names>R.</given-names></name></person-group> (<year>2021</year>). <source>Human-in-the-Loop Machine Learning: Active Learning and Annotation for Human-Centered AI</source>. <publisher-name>Manning</publisher-name>.</citation>
</ref>
<ref id="B134">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Naidu</surname> <given-names>G.</given-names></name> <name><surname>Zuva</surname> <given-names>T.</given-names></name> <name><surname>Sibanda</surname> <given-names>E. M.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;A review of evaluation metrics in machine learning algorithms,&#x0201D;</article-title> in <source>Computer Science On-line Conference</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>15</fpage>&#x02013;<lpage>25</lpage>.</citation>
</ref>
<ref id="B135">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Naiseh</surname> <given-names>M.</given-names></name> <name><surname>Al-Thani</surname> <given-names>D.</given-names></name> <name><surname>Jiang</surname> <given-names>N.</given-names></name> <name><surname>Ali</surname> <given-names>R.</given-names></name></person-group> (<year>2023</year>). <article-title>How the different explanation classes impact trust calibration: the case of clinical decision support systems</article-title>. <source>Int. J. Hum. Comput. Stud</source>. <volume>169</volume>:<fpage>102941</fpage>. <pub-id pub-id-type="doi">10.1016/j.ijhcs.2022.102941</pub-id></citation>
</ref>
<ref id="B136">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Nasr</surname> <given-names>M.</given-names></name> <name><surname>Shokri</surname> <given-names>R.</given-names></name> <name><surname>Houmansadr</surname> <given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Comprehensive privacy analysis of deep learning: passive and active white-box inference attacks against centralized and federated learning,&#x0201D;</article-title> in <source>2019 IEEE Symposium on Security and Privacy (SP)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>739</fpage>&#x02013;<lpage>753</lpage>.</citation>
</ref>
<ref id="B137">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nemani</surname> <given-names>P.</given-names></name> <name><surname>Joel</surname> <given-names>Y. D.</given-names></name> <name><surname>Vijay</surname> <given-names>P.</given-names></name> <name><surname>Liza</surname> <given-names>F. F.</given-names></name></person-group> (<year>2023</year>). <article-title>Gender bias in transformers: a comprehensive review of detection and mitigation strategies</article-title>. <source>Nat. Lang. Process. J</source>. <volume>6</volume>:<fpage>100047</fpage>. <pub-id pub-id-type="doi">10.1016/j.nlp.2023.100047</pub-id></citation>
</ref>
<ref id="B138">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ng</surname> <given-names>D. T. K.</given-names></name> <name><surname>Leung</surname> <given-names>J. K. L.</given-names></name> <name><surname>Chu</surname> <given-names>S. K. W.</given-names></name> <name><surname>Qiao</surname> <given-names>M. S.</given-names></name></person-group> (<year>2021</year>). <article-title>Conceptualizing ai literacy: an exploratory review</article-title>. <source>Comp. Educ. Artif. Intell</source>. <volume>2</volume>:<fpage>100041</fpage>. <pub-id pub-id-type="doi">10.1016/j.caeai.2021.100041</pub-id></citation>
</ref>
<ref id="B139">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nguyen</surname> <given-names>A.-P.</given-names></name> <name><surname>Mart&#x000ED;nez</surname> <given-names>M. R.</given-names></name></person-group> (<year>2020</year>). <article-title>On quantitative aspects of model interpretability</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2007.07584</pub-id></citation>
</ref>
<ref id="B140">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nicolae</surname> <given-names>M.-I.</given-names></name> <name><surname>Sinn</surname> <given-names>M.</given-names></name> <name><surname>Tran</surname> <given-names>M. N.</given-names></name> <name><surname>Buesser</surname> <given-names>B.</given-names></name> <name><surname>Rawat</surname> <given-names>A.</given-names></name> <name><surname>Wistuba</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Adversarial robustness Toolbox v1.0.0</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1807.01069</pub-id></citation>
</ref>
<ref id="B141">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Novelli</surname> <given-names>C.</given-names></name> <name><surname>Taddeo</surname> <given-names>M.</given-names></name> <name><surname>Floridi</surname> <given-names>L.</given-names></name></person-group> (<year>2023</year>). <article-title>Accountability in artificial intelligence: what it is and how it works</article-title>. <source>AI Soc</source>. <volume>39</volume>, <fpage>1</fpage>&#x02013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.2139/ssrn.4180366</pub-id></citation>
</ref>
<ref id="B142">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ntoutsi</surname> <given-names>E.</given-names></name> <name><surname>Fafalios</surname> <given-names>P.</given-names></name> <name><surname>Gadiraju</surname> <given-names>U.</given-names></name> <name><surname>Iosifidis</surname> <given-names>V.</given-names></name> <name><surname>Nejdl</surname> <given-names>W.</given-names></name> <name><surname>Vidal</surname> <given-names>M.-E.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Bias in data-driven artificial intelligence systems&#x02014;an introductory survey</article-title>. <source>Wiley Interdiscip. Rev</source>. <volume>10</volume>:<fpage>e1356</fpage>. <pub-id pub-id-type="doi">10.1002/widm.1356</pub-id></citation>
</ref>
<ref id="B143">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Nushi</surname> <given-names>B.</given-names></name> <name><surname>Kamar</surname> <given-names>E.</given-names></name> <name><surname>Horvitz</surname> <given-names>E.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Towards accountable AI: hybrid human-machine analyses for characterizing system failure,&#x0201D;</article-title> in <source>Proceedings of the AAAI Conference on Human Computation and Crowdsourcing, Vol. 6</source> (<publisher-loc>Washington, DC</publisher-loc>: <publisher-name>AAAI Press</publisher-name>), <fpage>126</fpage>&#x02013;<lpage>135</lpage>.</citation>
</ref>
<ref id="B144">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pammer-Schindler</surname> <given-names>V.</given-names></name> <name><surname>Lindstaedt</surname> <given-names>S.</given-names></name></person-group> (<year>2022</year>). <article-title>AI literacy f&#x000FC;r entscheidungstr&#x000E4;gerinnen im strategischen management</article-title>. <source>Wirtschaftsinformatik Manag</source>. <volume>14</volume>, <fpage>140</fpage>&#x02013;<lpage>143</lpage>. <pub-id pub-id-type="doi">10.1365/s35764-022-00399-2</pub-id></citation>
</ref>
<ref id="B145">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pedregosa</surname> <given-names>F.</given-names></name> <name><surname>Varoquaux</surname> <given-names>G.</given-names></name> <name><surname>Gramfort</surname> <given-names>A.</given-names></name> <name><surname>Michel</surname> <given-names>V.</given-names></name> <name><surname>Thirion</surname> <given-names>B.</given-names></name> <name><surname>Grisel</surname> <given-names>O.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>scikit-learn: machine learning in Python</article-title>. <source>J. Mach. Learn. Res</source>. <volume>12</volume>, <fpage>2825</fpage>&#x02013;<lpage>2830</lpage>.</citation>
</ref>
<ref id="B146">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pendleton</surname> <given-names>M.</given-names></name> <name><surname>Garcia-Lebron</surname> <given-names>R.</given-names></name> <name><surname>Cho</surname> <given-names>J.-H.</given-names></name> <name><surname>Xu</surname> <given-names>S.</given-names></name></person-group> (<year>2016</year>). <article-title>A survey on systems security metrics</article-title>. <source>ACM Comp. Surv</source>. <volume>49</volume>, <fpage>1</fpage>&#x02013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1145/3005714</pub-id></citation>
</ref>
<ref id="B147">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Pessach</surname> <given-names>D.</given-names></name> <name><surname>Shmueli</surname> <given-names>E.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;Algorithmic fairness,&#x0201D;</article-title> in <source>Machine Learning for Data Science Handbook: Data Mining and Knowledge Discovery Handbook</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>867</fpage>&#x02013;<lpage>886</lpage>.</citation>
</ref>
<ref id="B148">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Phong</surname> <given-names>L. T.</given-names></name> <name><surname>Aono</surname> <given-names>Y.</given-names></name> <name><surname>Hayashi</surname> <given-names>T.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Moriai</surname> <given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>Privacy-preserving deep learning via additively homomorphic encryption</article-title>. <source>IEEE Trans. Inf. Forensics Secur</source>. <volume>13</volume>, <fpage>1333</fpage>&#x02013;<lpage>1345</lpage>. <pub-id pub-id-type="doi">10.1109/TIFS.2017.2787987</pub-id></citation>
</ref>
<ref id="B149">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pleiss</surname> <given-names>G.</given-names></name> <name><surname>Raghavan</surname> <given-names>M.</given-names></name> <name><surname>Wu</surname> <given-names>F.</given-names></name> <name><surname>Kleinberg</surname> <given-names>J.</given-names></name> <name><surname>Weinberger</surname> <given-names>K. Q.</given-names></name></person-group> (<year>2017</year>). <article-title>On fairness and calibration</article-title>. <source>Adv. Neural Inf. Process. Syst</source>. <volume>30</volume>.</citation>
</ref>
<ref id="B150">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Poretschkin</surname> <given-names>M.</given-names></name> <name><surname>Schmitz</surname> <given-names>A.</given-names></name> <name><surname>Akila</surname> <given-names>M.</given-names></name> <name><surname>Adilova</surname> <given-names>L.</given-names></name> <name><surname>Becker</surname> <given-names>D.</given-names></name> <name><surname>Cremers</surname> <given-names>A. B.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Guideline for trustworthy artificial intelligence-ai assessment catalog</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2307.03681</pub-id></citation>
</ref>
<ref id="B151">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Radclyffe</surname> <given-names>C.</given-names></name> <name><surname>Ribeiro</surname> <given-names>M.</given-names></name> <name><surname>Wortham</surname> <given-names>R. H.</given-names></name></person-group> (<year>2023</year>). <article-title>The assessment list for trustworthy artificial intelligence: a review and recommendations</article-title>. <source>Front. Artif. Intell</source>. <volume>6</volume>:<fpage>1020592</fpage>. <pub-id pub-id-type="doi">10.3389/frai.2023.1020592</pub-id><pub-id pub-id-type="pmid">36967834</pub-id></citation></ref>
<ref id="B152">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rajpurkar</surname> <given-names>P.</given-names></name> <name><surname>Chen</surname> <given-names>E.</given-names></name> <name><surname>Banerjee</surname> <given-names>O.</given-names></name> <name><surname>Topol</surname> <given-names>E. J.</given-names></name></person-group> (<year>2022</year>). <article-title>AI in health and medicine</article-title>. <source>Nat. Med</source>. <volume>28</volume>, <fpage>31</fpage>&#x02013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-021-01614-0</pub-id><pub-id pub-id-type="pmid">35058619</pub-id></citation></ref>
<ref id="B153">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rechberger</surname> <given-names>C.</given-names></name> <name><surname>Walch</surname> <given-names>R.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Privacy-preserving machine learning using cryptography,&#x0201D;</article-title> in <source>Security and Artificial Intelligence</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>109</fpage>&#x02013;<lpage>129</lpage>.</citation>
</ref>
<ref id="B154">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>H.</given-names></name> <name><surname>Deng</surname> <given-names>J.</given-names></name> <name><surname>Xie</surname> <given-names>X.</given-names></name></person-group> (<year>2022</year>). <article-title>GRNN: generative regression neural network&#x02014;a data leakage attack for federated learning</article-title>. <source>ACM Transact. Intell. Syst. Technol</source>. <volume>13</volume>, <fpage>1</fpage>&#x02013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1145/3510032</pub-id></citation>
</ref>
<ref id="B155">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Ribeiro</surname> <given-names>M. T.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <name><surname>Guestrin</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>&#x0201C;&#x02018;Why should I trust you?&#x02019; Explaining the predictions of any classifier,&#x0201D;</article-title> in <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1135</fpage>&#x02013;<lpage>1144</lpage>.</citation>
</ref>
<ref id="B156">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Righetti</surname> <given-names>L.</given-names></name> <name><surname>Madhavan</surname> <given-names>R.</given-names></name> <name><surname>Chatila</surname> <given-names>R.</given-names></name></person-group> (<year>2019</year>). <article-title>Unintended consequences of biased robotic and artificial intelligence systems [ethical, legal, and societal issues]</article-title>. <source>IEEE Robot. Automat. Mag</source>. <volume>26</volume>, <fpage>11</fpage>&#x02013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1109/MRA.2019.2926996</pub-id></citation>
</ref>
<ref id="B157">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Roy</surname> <given-names>D.</given-names></name> <name><surname>Murty</surname> <given-names>K. R.</given-names></name> <name><surname>Mohan</surname> <given-names>C. K.</given-names></name></person-group> (<year>2015</year>). <article-title>&#x0201C;Feature selection using deep neural networks,&#x0201D;</article-title> in <source>2015 International Joint Conference on Neural Networks (IJCNN)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>6</lpage>.</citation>
</ref>
<ref id="B158">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rusak</surname> <given-names>E.</given-names></name> <name><surname>Schott</surname> <given-names>L.</given-names></name> <name><surname>Zimmermann</surname> <given-names>R. S.</given-names></name> <name><surname>Bitterwolf</surname> <given-names>J.</given-names></name> <name><surname>Bringmann</surname> <given-names>O.</given-names></name> <name><surname>Bethge</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>&#x0201C;A simple way to make neural networks robust against diverse image corruptions,&#x0201D;</article-title> in <source>European Conference on Computer Vision</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>53</fpage>&#x02013;<lpage>69</lpage>.</citation>
</ref>
<ref id="B159">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saleiro</surname> <given-names>P.</given-names></name> <name><surname>Kuester</surname> <given-names>B.</given-names></name> <name><surname>Hinkson</surname> <given-names>L.</given-names></name> <name><surname>London</surname> <given-names>J.</given-names></name> <name><surname>Stevens</surname> <given-names>A.</given-names></name> <name><surname>Anisfeld</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Aequitas: a bias and fairness audit toolkit</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.1811.05577</pub-id></citation>
</ref>
<ref id="B160">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Samek</surname> <given-names>W.</given-names></name> <name><surname>Binder</surname> <given-names>A.</given-names></name> <name><surname>Montavon</surname> <given-names>G.</given-names></name> <name><surname>Lapuschkin</surname> <given-names>S.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>K.-R.</given-names></name></person-group> (<year>2016</year>). <article-title>Evaluating the visualization of what a deep neural network has learned</article-title>. <source>IEEE Transact. Neural Netw. Learn. Syst</source>. <volume>28</volume>, <fpage>2660</fpage>&#x02013;<lpage>2673</lpage>. <pub-id pub-id-type="doi">10.1109/TNNLS.2016.2599820</pub-id><pub-id pub-id-type="pmid">27576267</pub-id></citation></ref>
<ref id="B161">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Samek</surname> <given-names>W.</given-names></name> <name><surname>Montavon</surname> <given-names>G.</given-names></name> <name><surname>Lapuschkin</surname> <given-names>S.</given-names></name> <name><surname>Anders</surname> <given-names>C. J.</given-names></name> <name><surname>M&#x000FC;ller</surname> <given-names>K.-R.</given-names></name></person-group> (<year>2021</year>). <article-title>Explaining deep neural networks and beyond: a review of methods and applications</article-title>. <source>Proc. IEEE</source> <volume>109</volume>, <fpage>247</fpage>&#x02013;<lpage>278</lpage>. <pub-id pub-id-type="doi">10.1109/JPROC.2021.3060483</pub-id></citation>
</ref>
<ref id="B162">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Saxena</surname> <given-names>N. A.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Perceptions of fairness,&#x0201D;</article-title> in <source>Proceedings of the 2019 AAAI/ACM Conference on AI, Ethics, and Society</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>AAAI; ACM</publisher-name>), <fpage>537</fpage>&#x02013;<lpage>538</lpage>.</citation>
</ref>
<ref id="B163">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Scher</surname> <given-names>S.</given-names></name> <name><surname>Tr&#x000FC;gler</surname> <given-names>A.</given-names></name></person-group> (<year>2023</year>). <article-title>Testing robustness of predictions of trained classifiers against naturally occurring perturbations</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2204.10046</pub-id></citation></ref>
<ref id="B164">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schneider</surname> <given-names>J.</given-names></name></person-group> (<year>2024</year>). <article-title>Explainable generative AI (genXAI): a survey, conceptualization, and research agenda</article-title>. <source>Artif. Intell. Rev</source>. <volume>57</volume>:<fpage>289</fpage>. <pub-id pub-id-type="doi">10.1007/s10462-024-10916-x</pub-id></citation>
</ref>
<ref id="B165">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Selvaraju</surname> <given-names>R. R.</given-names></name> <name><surname>Cogswell</surname> <given-names>M.</given-names></name> <name><surname>Das</surname> <given-names>A.</given-names></name> <name><surname>Vedantam</surname> <given-names>R.</given-names></name> <name><surname>Parikh</surname> <given-names>D.</given-names></name> <name><surname>Batra</surname> <given-names>D.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Grad-CAM: visual explanations from deep networks via gradient-based localization,&#x0201D;</article-title> in <source>Proceedings of the IEEE International Conference on Computer Vision (ICCV)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>618</fpage>&#x02013;<lpage>626</lpage>.</citation>
</ref>
<ref id="B166">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seyyed-Kalantari</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>McDermott</surname> <given-names>M. B.</given-names></name> <name><surname>Chen</surname> <given-names>I. Y.</given-names></name> <name><surname>Ghassemi</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Underdiagnosis bias of artificial intelligence algorithms applied to chest radiographs in under-served patient populations</article-title>. <source>Nat. Med</source>. <volume>27</volume>, <fpage>2176</fpage>&#x02013;<lpage>2182</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-021-01595-0</pub-id><pub-id pub-id-type="pmid">34893776</pub-id></citation></ref>
<ref id="B167">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>S.</given-names></name> <name><surname>Henderson</surname> <given-names>J.</given-names></name> <name><surname>Ghosh</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;CERTIFAI: a common framework to provide explanations and analyse the fairness and robustness of black-box models,&#x0201D;</article-title> in <source>Proceedings of the AAAI/ACM Conference on AI, Ethics, and Society</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>166</fpage>&#x02013;<lpage>172</lpage>.</citation>
</ref>
<ref id="B168">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Shrikumar</surname> <given-names>A.</given-names></name> <name><surname>Greenside</surname> <given-names>P.</given-names></name> <name><surname>Kundaje</surname> <given-names>A.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Learning important features through propagating activation differences,&#x0201D;</article-title> in <source>International Conference on Machine Learning</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>PMLR</publisher-name>), <fpage>3145</fpage>&#x02013;<lpage>3153</lpage>.</citation>
</ref>
<ref id="B169">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>&#x00160;imi&#x00107;</surname> <given-names>I.</given-names></name> <name><surname>Sabol</surname> <given-names>V.</given-names></name> <name><surname>Veas</surname> <given-names>E.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Perturbation effect: a metric to counter misleading validation of feature attribution,&#x0201D;</article-title> in <source>Proceedings of the 31st ACM International Conference on Information &#x00026; Knowledge Management</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1798</fpage>&#x02013;<lpage>1807</lpage>.</citation>
</ref>
<ref id="B170">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simkute</surname> <given-names>A.</given-names></name> <name><surname>Tankelevitch</surname> <given-names>L.</given-names></name> <name><surname>Kewenig</surname> <given-names>V.</given-names></name> <name><surname>Scott</surname> <given-names>A. E.</given-names></name> <name><surname>Sellen</surname> <given-names>A.</given-names></name> <name><surname>Rintel</surname> <given-names>S.</given-names></name></person-group> (<year>2024</year>). <article-title>Ironies of generative AI: understanding and mitigating productivity loss in human-AI interactions</article-title>. <source>Int. J. Hum. Comp. Interact</source>. <pub-id pub-id-type="doi">10.1080/10447318.2024.2405782</pub-id></citation>
</ref>
<ref id="B171">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Slokom</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Comparing recommender systems using synthetic data,&#x0201D;</article-title> in <source>Proceedings of the 12th ACM Conference on Recommender Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>548</fpage>&#x02013;<lpage>552</lpage>.</citation>
</ref>
<ref id="B172">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Smart</surname> <given-names>N. P.</given-names></name></person-group> (<year>2016</year>). <source>Cryptography Made Simple. Information Security and Cryptography</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B173">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smuha</surname> <given-names>N. A.</given-names></name></person-group> (<year>2019</year>). <article-title>The eu approach to ethics guidelines for trustworthy artificial intelligence</article-title>. <source>Comp. Law Rev. Int</source>. <volume>20</volume>, <fpage>97</fpage>&#x02013;<lpage>106</lpage>. <pub-id pub-id-type="doi">10.9785/cri-2019-200402</pub-id></citation>
</ref>
<ref id="B174">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Snyder</surname> <given-names>H.</given-names></name></person-group> (<year>2019</year>). <article-title>Literature review as a research methodology: an overview and guidelines</article-title>. <source>J. Bus. Res</source>. <volume>104</volume>, <fpage>333</fpage>&#x02013;<lpage>339</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbusres.2019.07.039</pub-id></citation>
</ref>
<ref id="B175">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Srivastava</surname> <given-names>M.</given-names></name> <name><surname>Heidari</surname> <given-names>H.</given-names></name> <name><surname>Krause</surname> <given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Mathematical notions vs. human perception of fairness: a descriptive approach to fairness for machine learning,&#x0201D;</article-title> in <source>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &#x00026; Data Mining</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>2459</fpage>&#x02013;<lpage>2468</lpage>.</citation>
</ref>
<ref id="B176">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Stadler</surname> <given-names>T.</given-names></name> <name><surname>Oprisanu</surname> <given-names>B.</given-names></name> <name><surname>Troncoso</surname> <given-names>C.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Synthetic data - anonymisation groundhog day,&#x0201D;</article-title> in <source>31st USENIX Security Symposium, USENIX Security 2022</source>, eds. K. T. B. Butler, and K. Thomas (<publisher-loc>Boston, MA</publisher-loc>: <publisher-name>USENIX Association</publisher-name>), <fpage>1451</fpage>&#x02013;<lpage>1468</lpage>.</citation>
</ref>
<ref id="B177">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stix</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>Actionable principles for artificial intelligence policy: three pathways</article-title>. <source>Sci. Eng. Ethics</source> <volume>27</volume>:<fpage>15</fpage>. <pub-id pub-id-type="doi">10.1007/s11948-020-00277-3</pub-id><pub-id pub-id-type="pmid">33608756</pub-id></citation></ref>
<ref id="B178">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sundararajan</surname> <given-names>M.</given-names></name> <name><surname>Taly</surname> <given-names>A.</given-names></name> <name><surname>Yan</surname> <given-names>Q.</given-names></name></person-group> (<year>2017</year>). <article-title>&#x0201C;Axiomatic attribution for deep networks,&#x0201D;</article-title> in <source>International Conference on Machine Learning</source> (<publisher-name>PMLR</publisher-name>), <fpage>3319</fpage>&#x02013;<lpage>3328</lpage>.</citation>
</ref>
<ref id="B179">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Tagiou</surname> <given-names>E.</given-names></name> <name><surname>Kanellopoulos</surname> <given-names>Y.</given-names></name> <name><surname>Aridas</surname> <given-names>C.</given-names></name> <name><surname>Makris</surname> <given-names>C.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;A tool supported framework for the assessment of algorithmic accountability,&#x0201D;</article-title> in <source>2019 10th International Conference on Information, Intelligence, Systems and Applications (IISA)</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>9</lpage>.</citation></ref>
<ref id="B180">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Tai</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>P.</given-names></name></person-group> (<year>2022</year>). <article-title>&#x0201C;Examining the utility of differentially private synthetic data generated using variational autoencoder with tensorflow privacy,&#x0201D;</article-title> in <source>27th IEEE Pacific Rim International Symposium on Dependable Computing, PRDC 2022</source> (<publisher-loc>Beijing</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>236</fpage>&#x02013;<lpage>241</lpage>.</citation>
</ref>
<ref id="B181">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thiebes</surname> <given-names>S.</given-names></name> <name><surname>Lins</surname> <given-names>S.</given-names></name> <name><surname>Sunyaev</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). <article-title>Trustworthy artificial intelligence</article-title>. <source>Electron. Mark</source>. <volume>31</volume>, <fpage>447</fpage>&#x02013;<lpage>464</lpage>. <pub-id pub-id-type="doi">10.1007/s12525-020-00441-4</pub-id></citation>
</ref>
<ref id="B182">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Toth</surname> <given-names>Z.</given-names></name> <name><surname>Caruana</surname> <given-names>R.</given-names></name> <name><surname>Gruber</surname> <given-names>T.</given-names></name> <name><surname>Loebbecke</surname> <given-names>C.</given-names></name></person-group> (<year>2022</year>). <article-title>The dawn of the ai robots: towards a new framework of ai robot accountability</article-title>. <source>J. Bus. Ethics</source> <volume>178</volume>, <fpage>895</fpage>&#x02013;<lpage>916</lpage>. <pub-id pub-id-type="doi">10.1007/s10551-022-05050-z</pub-id></citation>
</ref>
<ref id="B183">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van den Broek</surname> <given-names>E.</given-names></name> <name><surname>Sergeeva</surname> <given-names>A.</given-names></name> <name><surname>Huysman</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>When the machine meets the expert: an ethnography of developing ai for hiring</article-title>. <source>MIS Q</source>. <volume>45</volume>:<fpage>16559</fpage>. <pub-id pub-id-type="doi">10.25300/MISQ/2021/16559</pub-id></citation>
</ref>
<ref id="B184">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Vasudevan</surname> <given-names>S.</given-names></name> <name><surname>Kenthapadi</surname> <given-names>K.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;LiFT: a scalable framework for measuring fairness in ML applications,&#x0201D;</article-title> in <source>Proceedings of the 29th ACM International Conference on Information &#x00026; Knowledge Management</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>2773</fpage>&#x02013;<lpage>2780</lpage>.</citation>
</ref>
<ref id="B185">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Verma</surname> <given-names>S.</given-names></name> <name><surname>Rubin</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Fairness definitions explained,&#x0201D;</article-title> in <source>Proceedings of the International Workshop on Software Fairness (FairWare&#x00027;18)</source> (<publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>7</lpage>.</citation>
</ref>
<ref id="B186">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wachter</surname> <given-names>S.</given-names></name> <name><surname>Mittelstadt</surname> <given-names>B.</given-names></name> <name><surname>Russell</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>Why fairness cannot be automated: bridging the gap between eu non-discrimination law and AI</article-title>. <source>Comp. Law Sec. Rev</source>. <volume>41</volume>:<fpage>105567</fpage>. <pub-id pub-id-type="doi">10.1016/j.clsr.2021.105567</pub-id></citation>
</ref>
<ref id="B187">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wagner</surname> <given-names>I.</given-names></name> <name><surname>Eckhoff</surname> <given-names>D.</given-names></name></person-group> (<year>2018</year>). <article-title>Technical privacy metrics: a systematic survey</article-title>. <source>ACM Comp. Surv</source>. <volume>51</volume>, <fpage>1</fpage>&#x02013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1145/3168389</pub-id></citation>
</ref>
<ref id="B188">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>B. Y.</given-names></name> <name><surname>Boell</surname> <given-names>S. K.</given-names></name> <name><surname>Riemer</surname> <given-names>K.</given-names></name> <name><surname>Peter</surname> <given-names>S.</given-names></name></person-group> (<year>2023</year>). <article-title>&#x0201C;Human agency in AI configurations supporting organizational decision-making,&#x0201D;</article-title> in <source>ACIS 2023 Proceedings</source> (<publisher-loc>Atlanta, GA</publisher-loc>: <publisher-name>AIS</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>22</lpage>.</citation>
</ref>
<ref id="B189">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Yang</surname> <given-names>Q.</given-names></name> <name><surname>Abdul</surname> <given-names>A.</given-names></name> <name><surname>Lim</surname> <given-names>B. Y.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Designing theory-driven user-centric explainable AI,&#x0201D;</article-title> in <source>Proceedings of the 2019 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>15</lpage>.</citation>
</ref>
<ref id="B190">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Yang</surname> <given-names>H.</given-names></name> <name><surname>Feng</surname> <given-names>Y.</given-names></name> <name><surname>Sun</surname> <given-names>P.</given-names></name> <name><surname>Guo</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>&#x0201C;Towards transferable targeted adversarial examples,&#x0201D;</article-title> in <source>Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>20534</fpage>&#x02013;<lpage>20543</lpage>.</citation>
</ref>
<ref id="B191">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weber</surname> <given-names>L.</given-names></name> <name><surname>Lapuschkin</surname> <given-names>S.</given-names></name> <name><surname>Binder</surname> <given-names>A.</given-names></name> <name><surname>Samek</surname> <given-names>W.</given-names></name></person-group> (<year>2023</year>). <article-title>Beyond explaining: opportunities and challenges of XAI-based model improvement</article-title>. <source>Inf. Fus</source>. <volume>92</volume>, <fpage>154</fpage>&#x02013;<lpage>176</lpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2022.11.013</pub-id><pub-id pub-id-type="pmid">39122889</pub-id></citation></ref>
<ref id="B192">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>K.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Ding</surname> <given-names>M.</given-names></name> <name><surname>Ma</surname> <given-names>C.</given-names></name> <name><surname>Yang</surname> <given-names>H. H.</given-names></name> <name><surname>Farokhi</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Federated learning with differential privacy: algorithms and performance analysis</article-title>. <source>IEEE Trans. Inf. Forensics Secur</source>. <volume>15</volume>, <fpage>3454</fpage>&#x02013;<lpage>3469</lpage>. <pub-id pub-id-type="doi">10.1109/TIFS.2020.2988575</pub-id></citation>
</ref>
<ref id="B193">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Weisz</surname> <given-names>J. D.</given-names></name> <name><surname>He</surname> <given-names>J.</given-names></name> <name><surname>Muller</surname> <given-names>M.</given-names></name> <name><surname>Hoefer</surname> <given-names>G.</given-names></name> <name><surname>Miles</surname> <given-names>R.</given-names></name> <name><surname>Geyer</surname> <given-names>W.</given-names></name></person-group> (<year>2024</year>). <article-title>&#x0201C;Design principles for generative ai applications,&#x0201D;</article-title> in <source>Proceedings of the CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>22</lpage>.</citation>
</ref>
<ref id="B194">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weng</surname> <given-names>T. W.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Chen</surname> <given-names>P. Y.</given-names></name> <name><surname>Yi</surname> <given-names>J.</given-names></name> <name><surname>Su</surname> <given-names>D.</given-names></name> <name><surname>Gao</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>&#x0201C;Evaluating the robustness of neural networks: an extreme value theory approach,&#x0201D;</article-title> in <source>6th International Conference on Learning Representations, ICLR 2018</source>, <fpage>1</fpage>&#x02013;<lpage>18</lpage>.</citation>
</ref>
<ref id="B195">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wieringa</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>&#x0201C;What to account for when accounting for algorithms: a systematic literature review on algorithmic accountability,&#x0201D;</article-title> in <source>Proceedings of the 2020 Conference on Fairness, Accountability, and Transparency, FAT* &#x00027;20</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>18</lpage>.</citation>
</ref>
<ref id="B196">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wing</surname> <given-names>J. M.</given-names></name></person-group> (<year>2021</year>). <article-title>Trustworthy AI</article-title>. <source>Commun. ACM</source> <volume>64</volume>, <fpage>64</fpage>&#x02013;<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1145/3448248</pub-id></citation>
</ref>
<ref id="B197">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Winter</surname> <given-names>P. M.</given-names></name> <name><surname>Eder</surname> <given-names>S.</given-names></name> <name><surname>Weissenb&#x000F6;ck</surname> <given-names>J.</given-names></name> <name><surname>Schwald</surname> <given-names>C.</given-names></name> <name><surname>Doms</surname> <given-names>T.</given-names></name> <name><surname>Vogt</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Trusted artificial intelligence: towards certification of machine learning applications</article-title>. <source>arXiv</source> [preprint]. <pub-id pub-id-type="doi">10.48550/arXiv.2103.16910</pub-id></citation>
</ref>
<ref id="B198">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wolf</surname> <given-names>C. T.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Explainability scenarios: towards scenario-based XAI design,&#x0201D;</article-title> in <source>Proceedings of the 24th International Conference on Intelligent User Interfaces</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>252</fpage>&#x02013;<lpage>257</lpage>.</citation>
</ref>
<ref id="B199">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Xia</surname> <given-names>B.</given-names></name> <name><surname>Lu</surname> <given-names>Q.</given-names></name> <name><surname>Zhu</surname> <given-names>L.</given-names></name> <name><surname>Lee</surname> <given-names>S. U.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Xing</surname> <given-names>Z.</given-names></name></person-group> (<year>2024</year>). <article-title>&#x0201C;Towards a responsible AI metrics catalogue: a collection of metrics for AI accountability,&#x0201D;</article-title> in <source>Proceedings of the IEEE/ACM 3rd International Conference on AI Engineering - Software Engineering for AI, CAIN &#x00027;24</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>100</fpage>&#x02013;<lpage>111</lpage>.</citation>
</ref>
<ref id="B200">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>H.</given-names></name> <name><surname>Ma</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>H.-C.</given-names></name> <name><surname>Deb</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Tang</surname> <given-names>J.-L.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Adversarial attacks and defenses in images, graphs and text: A Review</article-title>. <source>Int. J. Automat. Comp</source>. <volume>17</volume>, <fpage>151</fpage>&#x02013;<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1007/s11633-019-1211-x</pub-id></citation>
</ref>
<ref id="B201">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yeung</surname> <given-names>K.</given-names></name></person-group> (<year>2020</year>). <article-title>Recommendation of the council on artificial intelligence (OECD)</article-title>. <source>Int. Legal Mater</source>. <volume>59</volume>, <fpage>27</fpage>&#x02013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1017/ilm.2020.5</pub-id><pub-id pub-id-type="pmid">32990065</pub-id></citation></ref>
<ref id="B202">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Yin</surname> <given-names>H.</given-names></name> <name><surname>Mallya</surname> <given-names>A.</given-names></name> <name><surname>Vahdat</surname> <given-names>A.</given-names></name> <name><surname>&#x000C1;lvarez</surname> <given-names>J. M.</given-names></name> <name><surname>Kautz</surname> <given-names>J.</given-names></name> <name><surname>Molchanov</surname> <given-names>P.</given-names></name></person-group> (<year>2021</year>). <article-title>&#x0201C;See through gradients: image batch recovery via GradInversion,&#x0201D;</article-title> in <source>IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2021, virtual</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>16337</fpage>&#x02013;<lpage>16346</lpage>.</citation>
</ref>
<ref id="B203">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Young</surname> <given-names>K.</given-names></name> <name><surname>Booth</surname> <given-names>G.</given-names></name> <name><surname>Simpson</surname> <given-names>B.</given-names></name> <name><surname>Dutton</surname> <given-names>R.</given-names></name> <name><surname>Shrapnel</surname> <given-names>S.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Deep neural network or dermatologist?,&#x0201D;</article-title> in <source>Interpretability of Machine Intelligence in Medical Image Computing and Multimodal Learning for Clinical Decision Support: Second International Workshop, iMIMIC 2019, and 9th International Workshop, ML-CDS 2019, Held in Conjunction with MICCAI 2019, Shenzhen, China, October 17, 2019, Proceedings 9</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>48</fpage>&#x02013;<lpage>55</lpage>.</citation>
</ref>
<ref id="B204">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zaeem</surname> <given-names>R. N.</given-names></name> <name><surname>Barber</surname> <given-names>K. S.</given-names></name></person-group> (<year>2020</year>). <article-title>The effect of the GDPR on privacy policies: recent progress and future promise</article-title>. <source>ACM Transact. Manag. Inf. Syst</source>. <volume>12</volume>, <fpage>1</fpage>&#x02013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1145/3389685</pub-id></citation>
</ref>
<ref id="B205">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zemel</surname> <given-names>R.</given-names></name> <name><surname>Wu</surname> <given-names>Y.</given-names></name> <name><surname>Swersky</surname> <given-names>K.</given-names></name> <name><surname>Pitassi</surname> <given-names>T.</given-names></name> <name><surname>Dwork</surname> <given-names>C.</given-names></name></person-group> (<year>2013</year>). <article-title>&#x0201C;Learning fair representations,&#x0201D;</article-title> in <source>International Conference on Machine Learning</source> (<publisher-name>PMLR</publisher-name>), <fpage>325</fpage>&#x02013;<lpage>333</lpage>.</citation>
</ref>
<ref id="B206">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Xie</surname> <given-names>Y.</given-names></name> <name><surname>Bai</surname> <given-names>H.</given-names></name> <name><surname>Yu</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Gao</surname> <given-names>Y.</given-names></name></person-group> (<year>2021</year>). <article-title>A survey on federated learning</article-title>. <source>Knowl. Based Syst</source>. <volume>216</volume>:<fpage>106775</fpage>. <pub-id pub-id-type="doi">10.1016/j.knosys.2021.106775</pub-id></citation>
</ref>
<ref id="B207">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>L.</given-names></name> <name><surname>Hu</surname> <given-names>Q.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name></person-group> (<year>2015</year>). <article-title>Heterogeneous feature selection with multi-modal deep neural networks and sparse group lasso</article-title>. <source>IEEE Transact. Multim</source>. <volume>17</volume>, <fpage>1936</fpage>&#x02013;<lpage>1948</lpage>. <pub-id pub-id-type="doi">10.1109/TMM.2015.2477058</pub-id></citation>
</ref>
<ref id="B208">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>X.</given-names></name> <name><surname>Wu</surname> <given-names>X.</given-names></name></person-group> (<year>2004</year>). <article-title>Class noise vs. attribute noise: a quantitative study</article-title>. <source>Artif. Intell. Rev</source>. <volume>22</volume>, <fpage>177</fpage>&#x02013;<lpage>210</lpage>. <pub-id pub-id-type="doi">10.1007/s10462-004-0751-8</pub-id></citation>
</ref>
<ref id="B209">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhuang</surname> <given-names>F.</given-names></name> <name><surname>Qi</surname> <given-names>Z.</given-names></name> <name><surname>Duan</surname> <given-names>K.</given-names></name> <name><surname>Xi</surname> <given-names>D.</given-names></name> <name><surname>Zhu</surname> <given-names>Y.</given-names></name> <name><surname>Zhu</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>A comprehensive survey on transfer learning</article-title>. <source>Proc. IEEE</source> <volume>109</volume>, <fpage>43</fpage>&#x02013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1109/JPROC.2020.3004555</pub-id></citation>
</ref>
<ref id="B210">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zimmerman</surname> <given-names>M.</given-names></name></person-group> (<year>2018</year>). <source>Teaching AI: Exploring new frontiers for learning</source>. <publisher-loc>Arlington, VA</publisher-loc>: <publisher-name>International Society for Technology in Education</publisher-name>.<pub-id pub-id-type="pmid">24092470</pub-id></citation></ref>
<ref id="B211">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zimmermann-Niefield</surname> <given-names>A.</given-names></name> <name><surname>Turner</surname> <given-names>M.</given-names></name> <name><surname>Murphy</surname> <given-names>B.</given-names></name> <name><surname>Kane</surname> <given-names>S. K.</given-names></name> <name><surname>Shapiro</surname> <given-names>R. B.</given-names></name></person-group> (<year>2019</year>). <article-title>&#x0201C;Youth learning machine learning through building models of athletic moves,&#x0201D;</article-title> in <source>Proceedings of the 18th ACM International Conference on Interaction Design and Children</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>121</fpage>&#x02013;<lpage>132</lpage>.</citation>
</ref>
<ref id="B212">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zou</surname> <given-names>Y.</given-names></name> <name><surname>Schaub</surname> <given-names>F.</given-names></name></person-group> (<year>2018</year>). <article-title>&#x0201C;Concern but no action: consumers&#x00027; reactions to the Equifax data breach,&#x0201D;</article-title> in <source>Extended Abstracts of the 2018 CHI Conference on Human Factors in Computing Systems</source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name>), <fpage>1</fpage>&#x02013;<lpage>6</lpage>.</citation>
</ref>
</ref-list>
</back>
</article>