<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Psychol.</journal-id>
<journal-title>Frontiers in Psychology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Psychol.</abbrev-journal-title>
<issn pub-type="epub">1664-1078</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpsyg.2024.1292808</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Psychology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>The influence of social feedback on reward learning in the Iowa gambling task</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Peng</surname> <given-names>Ming</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1262450/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Duan</surname> <given-names>Qiaochu</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2431899/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Xiaoying</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2152474/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tang</surname> <given-names>Rui</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2132637/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Lei</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/639322/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Hanshu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/2578261/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Li</surname> <given-names>Xu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/643140/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Key Laboratory of Adolescent Cyberpsychology and Behavior (CCNU), Ministry of Education</institution>, <addr-line>Wuhan</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>School of Psychology, Central China Normal University</institution>, <addr-line>Wuhan</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Key Laboratory of Human Development and Mental Health of Hubei Province</institution>, <addr-line>Wuhan</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Centre for Human Brain Health, School of Psychology, University of Birmingham</institution>, <addr-line>Birmingham</addr-line>, <country>United Kingdom</country></aff>
<aff id="aff5"><sup>5</sup><institution>Institute for Mental Health, School of Psychology, University of Birmingham</institution>, <addr-line>Birmingham</addr-line>, <country>United Kingdom</country></aff>
<author-notes>
<fn fn-type="edited-by" id="fn0001">
<p>Edited by: Igor Kagan, Deutsches Primatenzentrum, Germany</p>
</fn>
<fn fn-type="edited-by" id="fn0002">
<p>Reviewed by: Julia Case, Columbia University, United States</p>
<p>Kieran Stephen Mohr, University College Dublin, Ireland</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Xu Li, <email>xuli@ccnu.edu.cn</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>02</day>
<month>05</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1292808</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>09</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>17</day>
<month>04</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2024 Peng, Duan, Yang, Tang, Zhang, Zhang and Li.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Peng, Duan, Yang, Tang, Zhang, Zhang and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Learning, an important activity for both humans and animals, has long been a focal point of research. During the learning process, subjects assimilate not only their own information but also information from others, a phenomenon known as social learning. While numerous studies have explored the impact of social feedback as a reward/punishment during learning, few studies have investigated whether social feedback facilitates or inhibits the learning of environmental rewards/punishments. This study aims to test the effects of social feedback on economic feedback and its cognitive processes by using the Iowa Gambling Task (IGT). One hundred ninety-two participants were recruited and categorized into one non-social feedback group and four social feedback groups. Participants in the social feedback groups were informed that after the outcome of each choice, they would also receive feedback from an online peer. This peer was a fictitious entity, with variations in identity (novice or expert) and feedback type (random or effective). The Outcome-Representation Learning model (ORL model) was used to quantify the cognitive components of learning. Behavioral results showed that both the identity of the peer and the type of feedback provided significantly influenced the deck selection, with effective social feedback increasing the ratio of chosen good decks. Results in the ORL model showed that the four social feedback groups exhibited lower learning rates for gain and loss compared to the non-social feedback group, which suggested that, in the social feedback groups, the impact of the recent outcome on the update of value decreased. Parameters such as forgetfulness, win frequency, and deck perseverance in the expert-effective feedback group were significantly higher than those in the non-social feedback and expert-random feedback groups.
These findings suggest that individuals proactively evaluate feedback providers and selectively adopt effective feedback to enhance learning.</p>
</abstract>
<kwd-group>
<kwd>social feedback</kwd>
<kwd>reward learning</kwd>
<kwd>Iowa gambling task</kwd>
<kwd>computational model</kwd>
<kwd>feedback type</kwd>
<kwd>identity</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="45"/>
<page-count count="10"/>
<word-count count="7929"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Decision Neuroscience</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="sec1">
<label>1</label>
<title>Introduction</title>
<p>Learning is a central topic in psychological research and questions about learning have been addressed in virtually all areas of psychology (<xref ref-type="bibr" rid="ref12">De Houwer et al., 2013</xref>). Social learning is broadly defined as learning from or through interaction with other individuals. This form of learning is often adaptive because it allows learning about the world while minimizing exposure to predation and other threats and offers access to others&#x2019; innovations (<xref ref-type="bibr" rid="ref32">Olsson et al., 2020</xref>). People, even young children, draw rich inferences from the evidence provided by others and generate informative evidence that helps them learn (<xref ref-type="bibr" rid="ref15">Gweon, 2021</xref>).</p>
<p>Social information can be gleaned either by observing others&#x2019; behavior (<xref ref-type="bibr" rid="ref8">Charpentier et al., 2020</xref>; <xref ref-type="bibr" rid="ref42">Zhang et al., 2020</xref>; <xref ref-type="bibr" rid="ref43">Zhao et al., 2023</xref>) or by following explicit advice or social feedback (<xref ref-type="bibr" rid="ref17">Harris, 2012</xref>; <xref ref-type="bibr" rid="ref9">Colombo et al., 2014</xref>; <xref ref-type="bibr" rid="ref37">Van der Borght et al., 2016</xref>; <xref ref-type="bibr" rid="ref20">Hertz et al., 2021</xref>; <xref ref-type="bibr" rid="ref44">Zonca et al., 2021</xref>; <xref ref-type="bibr" rid="ref33">Schindler et al., 2022</xref>). Processing social feedback is essential for social learning, imitation, and adaptation; thus, it plays a crucial role in daily life (<xref ref-type="bibr" rid="ref38">V&#x00E9;lez and Gweon, 2021</xref>; <xref ref-type="bibr" rid="ref41">Zhang et al., 2022</xref>). Dozens of laboratory and field studies have shown that humans effectively shape others&#x2019; behavior through the use of selective rewards and punishments (<xref ref-type="bibr" rid="ref23">Ho et al., 2017</xref>, <xref ref-type="bibr" rid="ref22">2019</xref>).</p>
<p>Compared with other social information, social feedback not only provides information about the world, but also provides a positive feeling (<xref ref-type="bibr" rid="ref22">Ho et al., 2019</xref>). For example, teacher feedback can both improve achievement and foster pride. Therefore, there are at least two types of social feedback: social feedback itself as a reward/punishment, and social feedback that facilitates the function of an environmental or physical reward/punishment (usually a monetary incentive). For example, social feedback influences the processing of gain or loss in economic decisions (<xref ref-type="bibr" rid="ref31">Namba, 2021</xref>). The following questions are worth investigating: does the acquisition of knowledge through social rewards and punishments differ from that of feedback derived from conventional environmental or physical rewards and punishments? How do the two distinct forms of feedback interact with one another? Although some evidence suggests that shared neural regions are involved in processing social and physical feedback (<xref ref-type="bibr" rid="ref25">Izuma et al., 2008</xref>; <xref ref-type="bibr" rid="ref28">Lin et al., 2012</xref>), the precise nature of their interactions remains largely unexplored. This study aims to address this knowledge gap.</p>
<p>The Iowa Gambling Task (IGT) is a reward-learning task relying on monetary feedback (<xref ref-type="bibr" rid="ref4">Bechara et al., 1994</xref>). In the IGT, participants are required to choose from four decks, each of which elicits feedback in the form of either a reward or a punishment, and aim to obtain as great a reward as possible. Two of the decks have smaller immediate rewards, but result in greater net gains (classified as good decks), and two decks are associated with larger immediate rewards, but result in greater net losses (classified as bad decks; <xref ref-type="bibr" rid="ref4">Bechara et al., 1994</xref>). Normally, participants in the IGT adopt an explore-exploit strategy in which they first explore different decks and then exploit the most profitable one once they have found it (<xref ref-type="bibr" rid="ref4">Bechara et al., 1994</xref>; <xref ref-type="bibr" rid="ref30">Must et al., 2006</xref>; <xref ref-type="bibr" rid="ref1">Agay et al., 2010</xref>; <xref ref-type="bibr" rid="ref31">Namba, 2021</xref>).</p>
<p>Many studies have focused on how different people react to environmental feedback in the IGT (<xref ref-type="bibr" rid="ref7">Cauffman et al., 2010</xref>; <xref ref-type="bibr" rid="ref29">Mukherjee and Kable, 2014</xref>; <xref ref-type="bibr" rid="ref19">Hayes and Wedell, 2020b</xref>; <xref ref-type="bibr" rid="ref14">Garon and English, 2021</xref>; <xref ref-type="bibr" rid="ref34">Serrano et al., 2022</xref>). However, few recent studies have focused on the influence of social feedback in the task (<xref ref-type="bibr" rid="ref5">Case and Olino, 2020</xref>). One study examined learning patterns in response to both monetary and social incentives using modified versions of the IGT in a sample of 191 undergraduate students. The social feedback consisted of facial images displaying positive and negative emotions. The results showed that participants demonstrated learning in both the monetary and social tasks, as shown by decreases in play on bad decks across the task. Additionally, they found that overall task performance on monetary and social tasks was associated with fun-seeking, and that performance on the social task was also associated with depressive symptoms (<xref ref-type="bibr" rid="ref5">Case and Olino, 2020</xref>).</p>
<p>As mentioned before, social feedback can be used as a reward/punishment, or to facilitate the function of an environmental reward/punishment. Previous studies using the IGT have dealt with the former case (e.g., <xref ref-type="bibr" rid="ref28">Lin et al., 2012</xref>; <xref ref-type="bibr" rid="ref36">Thompson and Westwater, 2017</xref>; <xref ref-type="bibr" rid="ref5">Case and Olino, 2020</xref>); however, to the best of our knowledge, only one study has investigated the latter case (<xref ref-type="bibr" rid="ref31">Namba, 2021</xref>). That study investigated whether learning can be promoted by adding feedback in the form of facial expressions to the normal monetary feedback provided in the IGT. To ascertain the effect of facial-expression feedback, the researchers added a control condition that included feedback in the form of symbols (&#x25CB; and &#x00D7;). &#x25CB; has conventionally been used as feedback for positive or correct evaluations, while &#x00D7; has been used as feedback for negative or incorrect evaluations. These two conditions were similar in that both provided information and monetary feedback. The results revealed that the learning rate for facial expression feedback was slower in the middle of the task period than that for symbolic feedback (<xref ref-type="bibr" rid="ref31">Namba, 2021</xref>). Although this study demonstrated that social feedback affects reward learning, the underlying mechanism remains unknown.</p>
<p>Researchers have studied the conditions under which individuals rely on information from social sources to inform their behavior, which is known as Social Learning Strategies (SLS) (<xref ref-type="bibr" rid="ref27">Laland, 2004</xref>). These strategies, referred to as &#x201C;transmission biases&#x201D; or &#x201C;heuristics,&#x201D; are thought to lead individuals to imitate certain behaviors (known as &#x201C;what&#x201D; strategies), performed by certain individuals (known as &#x201C;who&#x201D; strategies), in certain contexts (known as &#x201C;when&#x201D; strategies) (<xref ref-type="bibr" rid="ref26">Kendal et al., 2018</xref>). However, they are not used indiscriminately. Through theoretical modeling and empirical evidence, it has been suggested that humans and non-human animals employ strategies such as copying when uncertain, copying the majority, and copying authoritative individuals, as the use of social information does not guarantee success (<xref ref-type="bibr" rid="ref21">Heyes, 2012</xref>; <xref ref-type="bibr" rid="ref32">Olsson et al., 2020</xref>). The objective of this study was to examine two distinct aspects of feedback, namely the effectiveness of feedback on &#x201C;what&#x201D; strategies and the role of the feedback provider&#x2019;s identity in &#x201C;who&#x201D; strategies according to SLS.</p>
<p>Learning from social feedback is an important form of social learning; however, it is still unclear how social feedback affects the internal cognitive process of environmental reward/punishment learning. Using a computational model, we can decompose the decision-making process into its components. Multiple computational models have been proposed, three of which were proposed by Ahn and colleagues, including the Prospect Valence Learning model with Delta rule (PVL-Delta) (<xref ref-type="bibr" rid="ref2">Ahn et al., 2008</xref>), Value-Plus-Perseverance model (VPP) (<xref ref-type="bibr" rid="ref3">Ahn et al., 2014</xref>), and Outcome-Representation Learning model (ORL) (<xref ref-type="bibr" rid="ref16">Haines et al., 2018</xref>). Their latest model, ORL, contains five free parameters: reward learning (A<sub>rew</sub>), punishment learning (A<sub>pun</sub>), forgetfulness (K), win frequency (&#x03B2;<sub>F</sub>), and deck perseverance (&#x03B2;<sub>P</sub>). A<sub>rew</sub> (0&#x2009;&#x003C;&#x2009;A<sub>rew</sub>&#x2009;&#x003C;&#x2009;1) and A<sub>pun</sub> (0&#x2009;&#x003C;&#x2009;A<sub>pun</sub>&#x2009;&#x003C;&#x2009;1) are learning rates used to update expectations after reward (i.e., positive) and punishment (i.e., negative) outcomes, respectively. When the learning rate is high, the most recent outcomes matter for the value update, whereas when the learning rate is low, the impact of the value of the most recent outcomes on the value update decreases (<xref ref-type="bibr" rid="ref9001">Rescorla and Wagner, 1972</xref>; <xref ref-type="bibr" rid="ref42">Zhang et al., 2020</xref>). K is a decay parameter that controls how quickly decision-makers forget their past deck choices, where lower values imply longer lasting memories of past choices.
Values for &#x03B2;<sub>F</sub> (&#x2212;&#x221E;&#x2009;&#x003C;&#x2009;&#x03B2;<sub>F</sub>&#x2009;&#x003C;&#x2009;+&#x221E;) less than or greater than 0 indicate that people prefer decks with a low or high win frequency, respectively, and values for &#x03B2;<sub>P</sub> (&#x2212;&#x221E;&#x2009;&#x003C;&#x2009;&#x03B2;<sub>P</sub>&#x2009;&#x003C;&#x2009;+&#x221E;) less than or greater than 0 indicate that people prefer to switch from or stay with recently chosen decks, respectively. ORL outperformed the previous two reinforcement learning models (PVL-Delta and VPP) in terms of prediction accuracy and parameter recovery (<xref ref-type="bibr" rid="ref16">Haines et al., 2018</xref>).</p>
<p>We integrate the identity and behavioral characteristics of feedback providers to examine how different characteristics affect an individual&#x2019;s learning. Two measures of learning performance were used. The first is the rate at which good decks were chosen, which serves as an indicator of behavioral performance. We hypothesized that task performance would be better with effective social feedback than with random or no social feedback. The second is the learning rate (A<sub>rew</sub> and A<sub>pun</sub>), an index of internal cognitive processes estimated with a computational model. Findings on the relationship between learning rate and performance have been inconsistent (<xref ref-type="bibr" rid="ref10">Cutler et al., 2021</xref>; <xref ref-type="bibr" rid="ref39">Westhoff et al., 2021</xref>). Notably, regarding whether a higher learning rate leads to better performance, we propose that in situations characterized by environmental stability and adequate instructional guidance, a lower learning rate is anticipated. Therefore, we hypothesized that a lower learning rate would be observed when feedback is effective and when the feedback provider is an expert.</p>
</sec>
<sec sec-type="methods" id="sec2">
<label>2</label>
<title>Methods</title>
<sec id="sec3">
<label>2.1</label>
<title>Participants</title>
<p>An a priori power analysis was conducted using G&#x002A;Power v.3.1 (<xref ref-type="bibr" rid="ref13">Faul et al., 2007</xref>) to determine the sample size for the nonsocial and social feedback settings. For the nonsocial setting, 24 participants were required with an alpha of 0.05, power (1 &#x2013; &#x03B2;) of 0.80, and a medium effect size of 0.25 for the within-group effect. For the social setting, 128 participants were required with an alpha of 0.05, power of 0.80, and a medium effect size of 0.25 for the within-between interaction effect. In total, 39 participants (25 females, mean&#x2009;&#x00B1;&#x2009;SE&#x2009;=&#x2009;20.6&#x2009;&#x00B1;&#x2009;2.6) were recruited for the nonsocial setting and 153 participants (109 females, mean&#x2009;&#x00B1;&#x2009;SE&#x2009;=&#x2009;20.1&#x2009;&#x00B1;&#x2009;2.1) were recruited for the social setting from a university located in Wuhan, Hubei province.</p>
<p>All participants were in good physical and mental health and were informed of the experiment procedure, rewards, and risks. Monetary rewards were dispensed after the experiment based on participants&#x2019; performance, with a range of 8&#x2013;10 Chinese yuan given as a participation fee.</p>
</sec>
<sec id="sec4">
<label>2.2</label>
<title>Iowa gambling task</title>
<p>Participants in the modified version of the Iowa Gambling Task (IGT) were presented with four decks labeled D, F, J, and K, which corresponded to four specific decks of cards randomly assigned (referred to as A, B, C, and D). Each deck of cards had two properties: gain and loss. The good decks (C and D) had an expected value of 25 yuan per 10 cards, while the bad decks (A and B) had an expected value of &#x2212;25 yuan per 10 cards (i.e., a net of 2.5 and &#x2212;2.5 yuan per card, respectively). Additionally, the decks differed in loss frequency: good deck C and bad deck A had frequent mixed outcomes (5 losses out of every 10 cards), while the other decks (B and D) had infrequent mixed outcomes (1 loss out of every 10 cards). The starting outcome was 0. The detailed payoff schedule is shown in <xref ref-type="table" rid="tab1">Table 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>The schedule of gains and losses for the four decks of cards used in the task.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Deck</th>
<th align="center" valign="top">Outcome</th>
<th align="center" valign="top" colspan="10">Payoff per 10 trials</th>
<th align="center" valign="top">Net</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top" rowspan="2">A</td>
<td align="center" valign="top">Gain</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">11</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">11</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="top" rowspan="2">&#x2212;2.5</td>
</tr>
<tr>
<td align="center" valign="top">Loss</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">&#x2212;15</td>
<td align="center" valign="middle">&#x2212;20</td>
<td align="center" valign="middle">&#x2212;25</td>
<td align="center" valign="middle">&#x2212;30</td>
<td align="center" valign="middle">&#x2212;35</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">B</td>
<td align="center" valign="top">Gain</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">11</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="middle">8</td>
<td align="center" valign="middle">9</td>
<td align="center" valign="middle">10</td>
<td align="center" valign="middle">11</td>
<td align="center" valign="middle">12</td>
<td align="center" valign="top" rowspan="2">&#x2212;2.5</td>
</tr>
<tr>
<td align="center" valign="top">Loss</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">&#x2212;125</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">C</td>
<td align="center" valign="top">Gain</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
<td align="center" valign="top" rowspan="2">2.5</td>
</tr>
<tr>
<td align="center" valign="top">Loss</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">&#x2212;1</td>
<td align="center" valign="middle">&#x2212;3</td>
<td align="center" valign="middle">&#x2212;5</td>
<td align="center" valign="middle">&#x2212;7</td>
<td align="center" valign="middle">&#x2212;9</td>
</tr>
<tr>
<td align="left" valign="top" rowspan="2">D</td>
<td align="center" valign="top">Gain</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
<td align="center" valign="middle">3</td>
<td align="center" valign="middle">4</td>
<td align="center" valign="middle">5</td>
<td align="center" valign="middle">6</td>
<td align="center" valign="middle">7</td>
<td align="center" valign="top" rowspan="2">2.5</td>
</tr>
<tr>
<td align="center" valign="top">Loss</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">0</td>
<td align="center" valign="middle">&#x2212;25</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The positions of the decks were randomized across participants, but the deck labels were always displayed in order from left to right, corresponding to the keyboard keys&#x2019; labels. On each trial, participants pressed the key corresponding to their chosen deck.</p>
<p>In the non-social feedback setting, participants completed the task alone. For the social feedback setting, participants were divided into four groups and given feedback from computer-simulated partners. The partners varied in terms of feedback type and identity: those with effective feedback gave supportive feedback for 80 percent of good deck choices and disapproving feedback for 80 percent of bad deck choices, while those with random feedback gave supportive feedback for 80 percent of all choices and disapproving feedback for 20 percent of all choices. The identities of the partners were set as novices (who knew nothing about the task) and experts (who had already learnt how to find better decks). The identity of the partner was introduced to the participants before the task began.</p>
</sec>
<sec id="sec5">
<label>2.3</label>
<title>Procedure</title>
<p>Participants were tested individually in either the non-social or the social feedback setting. In the social feedback setting, they were informed that they were collaborating with an anonymous partner online, who shared the same experiment screen content. Participants were given instructions on the computer screen. The experimenter highlighted the importance of winning as much money as possible, with their remuneration being contingent on the final outcome. For the social feedback group, the partner was either ignorant of the task (in the novice group) or had been provided instructions on how to find better decks (in the expert group). In actuality, the partner was simulated by a computer program, which also generated the social feedback.</p>
<p>The experiment lasted approximately 20&#x2013;30&#x2009;min and began with four decks labeled &#x201C;D,&#x201D; &#x201C;F,&#x201D; &#x201C;J,&#x201D; and &#x201C;K.&#x201D; After participants selected a deck, the monetary feedback for that choice was displayed for 2&#x2013;2.5&#x2009;s. In the social feedback setting, participants waited 1&#x2013;1.5&#x2009;s after receiving the monetary feedback, after which the partner&#x2019;s feedback (a thumbs-up or thumbs-down picture) was displayed for 0.8&#x2009;s. The task ended after participants finished 120 trials or when all cards in two of the decks had been chosen. The task flow is shown in <xref ref-type="fig" rid="fig1">Figure 1</xref>.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Experimental design. <bold>(A)</bold> Non-social feedback condition: participants chose from four decks and received monetary feedback. <bold>(B)</bold> Social feedback condition: participants chose a deck and received monetary feedback as in the non-social condition, and then received their partner&#x2019;s feedback, shown as a thumbs-up or thumbs-down picture; the partner was simulated by a computer.</p>
</caption>
<graphic xlink:href="fpsyg-15-1292808-g001.tif"/>
</fig>
</sec>
<sec id="sec6">
<label>2.4</label>
<title>Behavioral data process</title>
<p>A repeated-measure ANOVA of 4 blocks (1&#x2013;30 trials, 31&#x2013;60 trials, 61&#x2013;90 trials, 91&#x2013;120 trials) was used to analyze the chosen rate of good decks and the group switch rate in the non-social feedback setting. Similarly, a mixed-measure ANOVA of 4 blocks (1&#x2013;30 trials, 31&#x2013;60 trials, 61&#x2013;90 trials, 91&#x2013;120 trials)&#x2009;&#x00D7;&#x2009;2 feedback types (random, effective)&#x2009;&#x00D7;&#x2009;2 identities (novice, expert), as identity and feedback type were between-subjects, was used to analyze the chosen rate of good decks and the group switch rate in the social feedback setting. This was done to investigate the participants&#x2019; behavior changing tendencies. The higher chosen rate of good decks and the higher switch rate indicated better performance in seizing the pivot of the task and higher exploratory tendencies, respectively. We also did a one-way ANOVA of group (non-social group, novice-random group, novice-effective group, expert-random group, expert-effective group) on the slope of chosen rate to get the rate at which different groups of individuals learn.</p>
<p>The behavioral data were fitted with three models: the Prospect Valence Learning model with the delta rule, the Value-Plus-Perseverance model, and the Outcome-Representation Learning model. Detailed information on these three models is presented in the <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>. The analyses were conducted using the hBayesDM package (<xref ref-type="bibr" rid="ref9003">Ahn et al., 2017</xref>) in R (4.1.3) with 20,000 iterations. This package utilizes hierarchical Bayesian modeling, which is more stable than traditional fitting methods such as maximum likelihood estimation, and computes both group- and subject-level parameters. The distributions of the model parameters and the leave-one-out information criterion (LOOIC) were obtained. The lower the LOOIC, the better the model fit. To assess the effect of social feedback on learning, the parameter means of each social feedback group were compared with those of the non-social feedback group. The results were the posterior distributions of the mean differences of each parameter, computed as the parameter distribution of each of the four social feedback groups minus that of the non-social group. In the social feedback setting, the model parameters were each analyzed using a between-subjects ANOVA of 2 (feedback type: random, effective)&#x2009;&#x00D7;&#x2009;2 (identity: novice, expert). IBM SPSS Statistics 27, MATLAB R2020b and R 4.1.3 were used for data analysis and model calculation.</p>
</sec>
</sec>
<sec sec-type="results" id="sec7">
<label>3</label>
<title>Results</title>
<sec id="sec8">
<label>3.1</label>
<title>Behavior results</title>
<p>An analysis of the effect of decision-making blocks on the chosen rate of good decks (C, D) and the group switch rate in the non-social feedback group revealed a significant difference in the former (<italic>F</italic> (3,111)&#x2009;=&#x2009;15.31, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.29). Bonferroni&#x2019;s multiple comparisons indicated that the chosen rate of good decks in block 3 was significantly higher than that in block 1 (<italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), and block 4 was significantly higher than block 1 (<italic>p</italic>&#x2009;&#x003C;&#x2009;0.001), block 2 (<italic>p</italic>&#x2009;=&#x2009;0.001) and block 3 (<italic>p</italic>&#x2009;=&#x2009;0.019), suggesting that participants demonstrated a learning effect on the decks&#x2019; properties and an increase in the chosen rate of good decks as the decision-making process progressed (<xref ref-type="fig" rid="fig2">Figure 2</xref>). No significant difference in the group switch rate among blocks was observed (<italic>F</italic> (3,111)&#x2009;=&#x2009;1.29, <italic>p</italic>&#x2009;=&#x2009;0.23).</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Results of the non-social feedback group. The chosen ratio of good decks was the number of times C/D was chosen in each block divided by the number of trials in that block, and the switch ratio was the number of switches between good and bad decks in each block divided by the number of trials in that block. The chosen ratio of good decks increased significantly across blocks; the switch ratio decreased across blocks, although this decrease was not significant.</p>
</caption>
<graphic xlink:href="fpsyg-15-1292808-g002.tif"/>
</fig>
<p>In the social feedback group (<xref ref-type="fig" rid="fig3">Figure 3</xref>), a significant main effect of decision-making blocks on the chosen rate of good decks (C, D) was observed (<italic>F</italic> (3,447)&#x2009;=&#x2009;20.66, <italic>p</italic> &#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup> =&#x2009;0.12). Bonferroni&#x2019;s multiple comparisons revealed that the chosen rate of good decks in block 4 was significantly higher than that in block 1 (<italic>p</italic> &#x003C;&#x2009;0.001), block 2 (<italic>p</italic> &#x003C;&#x2009;0.001), and block 3 (<italic>p</italic> =&#x2009;0.006), indicating that participants demonstrated a learning effect on the decks&#x2019; properties and an increase in the chosen rate of good decks as the decision-making process progressed. Additionally, a significant main effect of partner&#x2019;s identity (<italic>F</italic> (1, 149)&#x2009;=&#x2009;4.18, <italic>p</italic> =&#x2009;0.043, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup> =&#x2009;0.03) and feedback type (<italic>F</italic> (1, 149)&#x2009;=&#x2009;11.73, <italic>p</italic> &#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup> =&#x2009;0.07) was observed, with the chosen rate of good decks being significantly higher when the partner was an expert than a novice, and the chosen rate of good decks in effective feedback being significantly higher than that in random feedback. A marginally significant interaction effect was observed between feedback type and partner identity (<italic>F</italic> (1, 149)&#x2009;=&#x2009;3.58, <italic>p</italic> =&#x2009;0.06): the chosen rate of good decks was significantly higher in the effective feedback group than in the random feedback group when the partner was an expert (<italic>p</italic> &#x003C;&#x2009;0.001), whereas when the partner was a novice, there was no significant difference between the two feedback groups.
The one-way ANOVA of group on the slope of the chosen rate showed no significant difference in slope (<italic>F</italic> (4, 191)&#x2009;=&#x2009;0.605, <italic>p</italic> =&#x2009;0.659).</p>
<fig position="float" id="fig3">
<label>Figure 3</label>
<caption>
<p>Results of the social feedback groups. The chosen ratio of good decks increased significantly across blocks and the switch ratio decreased across blocks.</p>
</caption>
<graphic xlink:href="fpsyg-15-1292808-g003.tif"/>
</fig>
<p>Our results indicated that decision-making blocks had a significant effect on group switch rate (<italic>F</italic> (3,447)&#x2009;=&#x2009;7.08, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.05). Bonferroni&#x2019;s multiple comparisons showed that the group switch rate in block 4 was significantly lower than that in blocks 1 and 2 (<italic>p</italic>&#x2009;=&#x2009;0.015). This suggests that, as decision-making progresses, participants exhibit a decrease in group switch rate. Neither partner&#x2019;s identity (<italic>F</italic> (1, 149)&#x2009;=&#x2009;0.07, <italic>p</italic>&#x2009;=&#x2009;0.80) nor feedback type (<italic>F</italic> (1, 149)&#x2009;=&#x2009;2.13, <italic>p</italic>&#x2009;=&#x2009;0.15) had a significant main effect, and there was no significant interaction between the two (<italic>F</italic> (1, 149)&#x2009;=&#x2009;0.169<italic>, p</italic>&#x2009;=&#x2009;0.682).</p>
</sec>
<sec id="sec9">
<label>3.2</label>
<title>Model comparison</title>
<p>An analysis of the model performance between the PVL-delta model, VPP model and ORL model with the data of non-social and social feedback groups, as shown in <xref ref-type="table" rid="tab2">Table 2</xref>, demonstrates that the ORL model is the best fit.</p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Results of model comparison.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top" colspan="3">LOOIC</th>
</tr>
<tr>
<th/>
<th align="center" valign="top">PVL-delta</th>
<th align="center" valign="top">VPP</th>
<th align="center" valign="top">ORL</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Non-social</td>
<td align="center" valign="top">12215.56</td>
<td align="center" valign="top">11281.95</td>
<td align="center" valign="top">11251.08</td>
</tr>
<tr>
<td align="left" valign="top">Novice-random</td>
<td align="center" valign="top">13172.05</td>
<td align="center" valign="top">12406.50</td>
<td align="center" valign="top">12285.86</td>
</tr>
<tr>
<td align="left" valign="top">Novice-effective</td>
<td align="center" valign="top">11614.71</td>
<td align="center" valign="top">10786.92</td>
<td align="center" valign="top">10729.26</td>
</tr>
<tr>
<td align="left" valign="top">Expert-random</td>
<td align="center" valign="top">11850.38</td>
<td align="center" valign="top">10962.58</td>
<td align="center" valign="top">10922.58</td>
</tr>
<tr>
<td align="left" valign="top">Expert-effective</td>
<td align="center" valign="top">11205.61</td>
<td align="center" valign="top">10740.78</td>
<td align="center" valign="top">10691.33</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec10">
<label>3.3</label>
<title>Parameter analysis</title>
<p>The comparison of the posterior distribution of mean differences between non-social feedback group and each social feedback group showed that the A<sub>rew</sub> and A<sub>pun</sub> of the non-social feedback group were significantly higher than those of the social feedback group, as <xref ref-type="fig" rid="fig4">Figure 4</xref> and <xref ref-type="table" rid="tab3">Table 3</xref> show, with the HDI differences of A<sub>rew</sub> and A<sub>pun</sub> between the two groups being distributed away from zero. Additionally, the K and &#x03B2;<sub>F</sub> of the expert-effective group were significantly higher than those of the non-social feedback group, with the HDI differences of K and &#x03B2;<sub>F</sub> between the two groups also being distributed away from zero.</p>
<fig position="float" id="fig4">
<label>Figure 4</label>
<caption>
<p>HDI differences of parameters between non-social and social feedback conditions.</p>
</caption>
<graphic xlink:href="fpsyg-15-1292808-g004.tif"/>
</fig>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Differences of the posterior distribution of parameters mean between non-social and social condition (HDI).</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th align="center" valign="top" colspan="5">Difference with non-social group</th>
</tr>
<tr>
<th/>
<th align="center" valign="top">A<sub>rew</sub></th>
<th align="center" valign="top">A<sub>pun</sub></th>
<th align="center" valign="top">K</th>
<th align="center" valign="top">&#x03B2;<sub>P</sub></th>
<th align="center" valign="top">&#x03B2;<sub>F</sub></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Novice-random</td>
<td align="center" valign="middle">[&#x2212;0.523, &#x2212;0.210]</td>
<td align="center" valign="middle">[&#x2212;0.267, &#x2212;0.047]</td>
<td align="center" valign="middle">[&#x2212;0.492, 0.032]</td>
<td align="center" valign="middle">[&#x2212;1.131, 0.957]</td>
<td align="center" valign="middle">[&#x2212;0.220, 0.870]</td>
</tr>
<tr>
<td align="left" valign="top">Novice-effective</td>
<td align="center" valign="middle">[&#x2212;0.469, &#x2212;0.139]</td>
<td align="center" valign="middle">[&#x2212;0.256, &#x2212;0.034]</td>
<td align="center" valign="middle">[&#x2212;0.351, 0.458]</td>
<td align="center" valign="middle">[&#x2212;0.679, 1.529]</td>
<td align="center" valign="middle">[&#x2212;0.157, 0.934]</td>
</tr>
<tr>
<td align="left" valign="top">Expert-random</td>
<td align="center" valign="middle">[&#x2212;0.549, &#x2212;0.261]</td>
<td align="center" valign="middle">[&#x2212;0.321, &#x2212;0.133]</td>
<td align="center" valign="middle">[&#x2212;0.045, 0.877]</td>
<td align="center" valign="middle">[&#x2212;0.371, 2.360]</td>
<td align="center" valign="middle">[&#x2212;0.575, 0.518]</td>
</tr>
<tr>
<td align="left" valign="top">Expert-effective</td>
<td align="center" valign="middle">[&#x2212;0.549, &#x2212;0.261]</td>
<td align="center" valign="middle">[&#x2212;0.285, &#x2212;0.071]</td>
<td align="center" valign="middle">[1.545, 4.457]</td>
<td align="center" valign="middle">[&#x2212;0.371, 2.360]</td>
<td align="center" valign="middle">[0.213, 1.456]</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>A between-subjects ANOVA analysis was conducted for the social feedback condition, with the results shown in <xref ref-type="fig" rid="fig5">Figure 5</xref> and <xref ref-type="table" rid="tab4">Table 4</xref>. The results revealed a significant main effect of partner&#x2019;s identity (<italic>F</italic> (1, 153)&#x2009;=&#x2009;65.67, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.30) on A<sub>rew</sub>, but no significant main effect of feedback type (<italic>F</italic> (1, 153)&#x2009;=&#x2009;1.97, <italic>p</italic>&#x2009;=&#x2009;0.16). Additionally, a significant interaction effect of partner&#x2019;s identity &#x00D7; feedback type was observed (<italic>F</italic> (1, 153)&#x2009;=&#x2009;65.89, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.31). Further simple effect analysis indicated that A<sub>rew</sub> of novices was significantly higher than that of experts in effective feedback (<italic>F</italic> (1, 152)&#x2009;=&#x2009;127.65, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.46), but there was no significant difference between novice and expert when in random feedback (<italic>F</italic> (1, 152)&#x2009;=&#x2009;0.00, <italic>p</italic>&#x2009;=&#x2009;0.96).</p>
<fig position="float" id="fig5">
<label>Figure 5</label>
<caption>
<p>Results of ANOVA in social feedback groups.</p>
</caption>
<graphic xlink:href="fpsyg-15-1292808-g005.tif"/>
</fig>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Values of parameters in social condition.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Identity</th>
<th align="center" valign="top">Type</th>
<th align="center" valign="top">A<sub>rew</sub></th>
<th align="center" valign="top">A<sub>pun</sub></th>
<th align="center" valign="top">K</th>
<th align="center" valign="top">&#x03B2;<sub>F</sub></th>
<th align="center" valign="top">&#x03B2;<sub>P</sub></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="middle" rowspan="2">Novice</td>
<td align="center" valign="middle">Random</td>
<td align="center" valign="middle">0.27&#x2009;&#x00B1;&#x2009;0.08</td>
<td align="center" valign="middle">0.21&#x2009;&#x00B1;&#x2009;0.15</td>
<td align="center" valign="middle">0.54&#x2009;&#x00B1;&#x2009;0.36</td>
<td align="center" valign="middle">1.69&#x2009;&#x00B1;&#x2009;0.84</td>
<td align="center" valign="middle">&#x2212;0.84&#x2009;&#x00B1;&#x2009;2.44</td>
</tr>
<tr>
<td align="center" valign="middle">Effective</td>
<td align="center" valign="middle">0.35&#x2009;&#x00B1;&#x2009;0.06</td>
<td align="center" valign="middle">0.24&#x2009;&#x00B1;&#x2009;0.19</td>
<td align="center" valign="middle">0.73&#x2009;&#x00B1;&#x2009;0.37</td>
<td align="center" valign="middle">1.72&#x2009;&#x00B1;&#x2009;0.85</td>
<td align="center" valign="middle">&#x2212;0.49&#x2009;&#x00B1;&#x2009;2.20</td>
</tr>
<tr>
<td align="left" valign="middle" rowspan="2">Expert</td>
<td align="center" valign="middle">Random</td>
<td align="center" valign="middle">0.27&#x2009;&#x00B1;&#x2009;0.07</td>
<td align="center" valign="middle">0.13&#x2009;&#x00B1;&#x2009;0.08</td>
<td align="center" valign="middle">0.95&#x2009;&#x00B1;&#x2009;0.35</td>
<td align="center" valign="middle">1.39&#x2009;&#x00B1;&#x2009;0.92</td>
<td align="center" valign="middle">0.36&#x2009;&#x00B1;&#x2009;4.06</td>
</tr>
<tr>
<td align="center" valign="middle">Effective</td>
<td align="center" valign="middle">0.15&#x2009;&#x00B1;&#x2009;0.10</td>
<td align="center" valign="middle">0.18&#x2009;&#x00B1;&#x2009;0.12</td>
<td align="center" valign="middle">2.45&#x2009;&#x00B1;&#x2009;0.47</td>
<td align="center" valign="middle">2.04&#x2009;&#x00B1;&#x2009;0.64</td>
<td align="center" valign="middle">7.03&#x2009;&#x00B1;&#x2009;11.95</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Results revealed a significant main effect of partner&#x2019;s identity on A<sub>pun</sub> parameters (<italic>F</italic> (1, 153)&#x2009;=&#x2009;8.87, <italic>p</italic>&#x2009;=&#x2009;0.003, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.06), with novice A<sub>pun</sub> being higher than that of expert. The main effect of feedback types was not significant (<italic>F</italic> (1, 153)&#x2009;=&#x2009;3.65, <italic>p</italic>&#x2009;=&#x2009;0.06), and no interaction effect between feedback type and partner&#x2019;s identity was observed (<italic>F</italic> (1, 153)&#x2009;=&#x2009;0.11, <italic>p</italic>&#x2009;=&#x2009;0.74).</p>
<p>Analysis of K parameters revealed a significant main effect of partner&#x2019;s identity (<italic>F</italic> (1, 153)&#x2009;=&#x2009;292.04, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.66) and feedback type (<italic>F</italic> (1, 153)&#x2009;=&#x2009;183.44, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.55), in addition to a significant interaction effect of partner&#x2019;s identity &#x00D7; feedback type (<italic>F</italic> (1, 153)&#x2009;=&#x2009;112.45, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.43). Further simple effect analysis indicated that, when the partner was an expert, <italic>K</italic> values were significantly higher with effective feedback than with random feedback (<italic>F</italic> (1, 152)&#x2009;=&#x2009;96.21, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.39). However, there was no significant difference between effective and random feedback when the partner was a novice (<italic>F</italic> (1, 152)&#x2009;=&#x2009;2.80, <italic>p</italic>&#x2009;=&#x2009;0.10).</p>
<p>Results revealed a significant main effect of feedback type (<italic>F</italic> (1, 153)&#x2009;=&#x2009;6.66, <italic>p</italic>&#x2009;=&#x2009;0.011, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.04) on &#x03B2;<sub>F</sub>. However, the main effect of partner&#x2019;s identity was not significant (<italic>F</italic> (1, 153)&#x2009;=&#x2009;0.00, <italic>p</italic>&#x2009;=&#x2009;0.95). Additionally, a significant interaction effect of partner&#x2019;s identity &#x00D7; feedback type was observed (<italic>F</italic> (1, 153)&#x2009;=&#x2009;5.56, <italic>p</italic>&#x2009;=&#x2009;0.020, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.04). Subsequent simple effect analysis revealed that the &#x03B2;<sub>F</sub> of effective feedback was significantly higher than that of random feedback when the partner was an expert (<italic>F</italic> (1, 152)&#x2009;=&#x2009;11.91, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.07), but there was no significant difference between random feedback and effective feedback when the partner was a novice (<italic>F</italic> (1, 152)&#x2009;=&#x2009;0.03, <italic>p</italic>&#x2009;=&#x2009;0.87).</p>
<p>A significant main effect of partner&#x2019;s identity (<italic>F</italic> (1, 153)&#x2009;=&#x2009;10.81, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.07) and feedback type (<italic>F</italic> (1, 153)&#x2009;=&#x2009;6.99, <italic>p</italic>&#x2009;=&#x2009;0.009, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.05) was observed for &#x03B2;<sub>P</sub> parameters. Additionally, a significant interaction effect of partner&#x2019;s identity and feedback type was also seen (<italic>F</italic> (1, 153)&#x2009;=&#x2009;5.67, <italic>p</italic>&#x2009;=&#x2009;0.019, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.04). Subsequent simple effect analysis revealed that the &#x03B2;<sub>P</sub> for effective feedback was higher than that of random feedback when the partner was an expert (<italic>F</italic> (1, 152)&#x2009;=&#x2009;11.49, <italic>p</italic>&#x2009;&#x003C;&#x2009;0.001, &#x03B7;<italic><sub>p</sub></italic><sup>2</sup>&#x2009;=&#x2009;0.07), however, there was no significant difference between random feedback and effective feedback when the partner was a novice (<italic>F</italic> (1, 152)&#x2009;=&#x2009;0.10, <italic>p</italic>&#x2009;=&#x2009;0.75).</p>
</sec>
</sec>
<sec sec-type="discussion" id="sec11">
<label>4</label>
<title>Discussion</title>
<p>This study employed the Iowa Gambling Task (IGT) to examine the impact of social feedback on economic feedback. We utilized the IGT with and without social feedback and evaluated three computational models, finding that the Outcome-Representation Learning (ORL) model displayed the most successful performance in all five conditions. Subsequently, we explored the effects of the identity of the feedback provider and the type of feedback on learning behavior and cognitive process. The results indicated that the chosen rate of good decks was affected by the identity and type of feedback, respectively. Moreover, the parameters in the ORL model were differently impacted by identity, type, and the interaction between them.</p>
<p>Consistent with previous studies on the IGT, participants in a non-social feedback setting showed a significant difference in the ratio of chosen good decks across the blocks. As the experiment progressed, a gradual learning of the characteristics of the cards was observed, with an increased preference for the good decks (<xref ref-type="bibr" rid="ref4">Bechara et al., 1994</xref>; <xref ref-type="bibr" rid="ref6">Cassotti et al., 2014</xref>; <xref ref-type="bibr" rid="ref41">Zhang et al., 2022</xref>). However, contrary to <xref ref-type="bibr" rid="ref4">Bechara et al.&#x2019;s (1994)</xref> hypothesis that the switch between options would become less frequent as the experiment went on, the rate of switching between the good and bad decks, as well as between decks within each category, showed no significant change by the end of the experiment, suggesting that the persistence of choice remained constant. This result is not unusual in previous studies: <xref ref-type="bibr" rid="ref35">Steingroever et al. (2012)</xref> reviewed studies that used the original or modified versions of the IGT and found that participants did not demonstrate a systematic decrease in the number of switches across trials.</p>
<p>In the social feedback setting of the IGT task, feedback providers were divided into novices and experts and feedback type was divided into random and effective feedback, in order to explore the influence of feedback type and provider identity on learning. Results showed that participants gradually favored the good card decks, indicating that they had learned the characteristics of the card decks. Furthermore, the feedback provider&#x2019;s identity and type had an effect on the selection ratio of the good decks, with the expert feedback group and the effective feedback group selecting the good decks significantly more than the novice feedback group and the random feedback group, respectively. Additionally, a marginal significant interaction effect was observed between identity and type, indicating that participants in the expert group were more likely to select good decks in the effective feedback group than in the random feedback group. This indicated that the subjects pay more attention to the feedback of experts, but they do not blindly follow the feedback of experts. Only effective feedback of experts can significantly increase the learning of the subjects. If feedback providers are novice, the subjects will not pay much attention to their feedback, so whether their feedback is effective or not, the difference in deck selection is not significant. It&#x2019;s worth noting that the slope of chosen rate on good decks did not differ across five groups. This suggested that, based on the current task (IGT) and two types of social feedback (approving or disapproving), while effective social feedback can lead to an overall improvement in performance, it does not accelerate the learning process. However, it remains possible that social feedback in a different learning task or under varied social feedback conditions could accelerate learning.</p>
<p>The switch rate between the good and bad decks in the social feedback setting was significantly impacted by the decision block. As the experiment progressed, the switch rate between the two decks decreased significantly. Participants, at first, tended to explore to alleviate their uncertainties in beliefs, as demonstrated by their higher rate of choice switching in block 1 and block 2 compared to block 4. When they had gathered enough information, they then proceeded to exploit it (<xref ref-type="bibr" rid="ref24">Hofmans and van den Bos, 2022</xref>). There was no difference between the four groups, indicating that the behavioral choices of the four groups were gradually becoming stable.</p>
<p>The result of model comparison revealed that the ORL model was the best-performing model in five groups after fitting the data in the PVL-delta, VPP, and ORL models and comparing the results. Theoretically, according to the ORL model, participants in the IGT learned the valence of the options (A<sub>rew</sub> and A<sub>pun</sub>), deliberated on the effect of the loss probability of the options (&#x03B2;<sub>F</sub>), and showed an inclination to persist with their prior decisions (&#x03B2;<sub>P</sub>). Meanwhile, individuals exhibited variance in their recollection of their deck selection (K).</p>
<p>A<sub>rew</sub> and A<sub>pun</sub>, the computational model parameters, reflect the degree to which participants learn from the current gain and loss outcomes of the decks. The comparison of the posterior distribution of mean differences between the non-social feedback group and each social feedback group showed that, compared to the non-social feedback group, the four social feedback groups exhibited lower learning rates for gains and losses. Furthermore, under effective feedback, the gains learning rate (A<sub>rew</sub>) of the participants in the novice feedback group was significantly higher than that of the expert feedback group, and the losses learning rate (A<sub>pun</sub>) of the novice feedback group was significantly higher than that of the expert feedback group regardless of effective or random feedback. The evidence indicated that in the absence of effective feedback, individuals placed greater weight on recent outcomes when updating option values.</p>
<p>Previous studies have yielded inconsistent results regarding the relationship between learning rate and task performance. <xref ref-type="bibr" rid="ref10">Cutler et al. (2021)</xref> found that individuals with higher learning rates performed better in reinforcement learning tasks when conducted in young and elderly groups under different reward recipient conditions. Conversely, <xref ref-type="bibr" rid="ref39">Westhoff et al. (2021)</xref> observed that the learning rate decreased with age and task performance improved in probabilistic reinforcement learning tasks among children and adolescents. These divergent findings can be attributed to the uncertainty of gains and losses in the experimental environment. A lower learning rate in a stable yet ambiguous environment allows for better comprehension of environmental information, while a higher learning rate in a changing environment helps capture large fluctuations in the value of options. The task in this study resembled a stable environment (<xref ref-type="bibr" rid="ref18">Hayes and Wedell, 2020a</xref>,<xref ref-type="bibr" rid="ref19">b</xref>), suggesting that the subjects&#x2019; low learning rate likely contributes to their enhanced performance. In addition, this study incorporated two types of feedback, economic feedback (gain or loss) and social feedback (approving or disapproving), however, only the learning of economic feedback is included in the model. It is also possible that effective social feedback could lead subjects to learn from both social feedback and economic feedback (<xref ref-type="bibr" rid="ref24">Hofmans and van den Bos, 2022</xref>), potentially resulting in a decrease in the learning rate of economic feedback. However, this hypothesis requires further investigation.</p>
<p>In the task, the frequency of losses varies for each deck of cards, and the computational model parameter &#x03B2;<sub>F</sub> indicates how much the outcome frequency influences the participants&#x2019; evaluation of options (<xref ref-type="bibr" rid="ref16">Haines et al., 2018</xref>). Parameter K reflects the influence of preceding trials (<xref ref-type="bibr" rid="ref16">Haines et al., 2018</xref>). A higher K in the expert-effective group implies that participants are considering more recent options. The results of the study showed that the &#x03B2;<sub>F</sub> and K parameters in the expert-effective feedback group were significantly higher than those in the non-social feedback and expert-random feedback groups, respectively. This suggests that participants were more likely to consider win frequency across trials and more recent options when provided with effective guidance (<xref ref-type="bibr" rid="ref16">Haines et al., 2018</xref>). Additionally, the &#x03B2;<sub>P</sub> parameter in the expert-effective group was significantly higher than that in the expert-random feedback group, indicating that participants had a greater degree of persistence in the process of option value formation when provided with effective feedback. As experts provided feedback, learners verified its effectiveness, leading to discrepancies between expert-effective feedback and expert-random feedback.</p>
<p>The results of this study indicated that there was no significant difference between the effective and random groups in the novice feedback group for the three parameters, &#x03B2;<sub>F</sub>, &#x03B2;<sub>P</sub> and K. <xref ref-type="bibr" rid="ref38">V&#x00E9;lez and Gweon (2021)</xref> postulate that in the process of social learning, individuals not only process the information itself, but also assess the agent providing the information. If the content or accuracy of the information aligns with the identity of the agent, the individual&#x2019;s evaluation of the agent increases and the weight of the information provided is amplified. Conversely, if the agent is deemed to be a novice, the participant may deem the feedback to be less informative, thus reducing the weight of the information provided. This study demonstrated that participants formed expectations for the effectiveness of feedback based on the peer&#x2019;s past knowledge and experience, and when the peer was a novice, the participants thought that their feedback might not be very informative. Even if the peer provided effective feedback, these three parameters were still little affected.</p>
<p>Results of the analysis of the ratio of chosen good decks and the three parameters of &#x03B2;<sub>F</sub>, &#x03B2;<sub>P</sub> and K revealed an interaction effect of identity and type. It was observed that participants&#x2019; perception of the feedback providers (whether they were experts or not) had an influence on the extent to which they considered the opinion and evaluated the effectiveness of the feedback. If they found that the opinions of experts were ineffective, they would reduce the influence of social feedback. This can be explained by the &#x2018;when&#x2019; strategy of SLS, which suggests that when participants lack sufficient information to make optimal decisions in the IGT, they tend to rely on information from others, especially in uncertain situations. Additionally, the &#x2018;who&#x2019; strategy, which entails taking cues from individuals who are more knowledgeable or experienced with the task, may also play a significant role (<xref ref-type="bibr" rid="ref32">Olsson et al., 2020</xref>).</p>
<p>This study has certain limitations that should be noted. Firstly, in this study, we used two kinds of feedback, economic feedback and social feedback, and subjects would consider both kinds of feedback to determine their behavior during the IGT. However, the ORL model did not incorporate social feedback. Future research could design various models that incorporate social feedback to reveal how people integrate them. Secondly, in our experiment, the ratio of positive and negative feedback is 80:20 in all social feedback groups. However, in the effective feedback group, the average rate of good decks was less than 60% in the whole task, so the positive feedback ratio of subjects in the effective feedback group was generally lower than 80%, which would cause imbalanced frequencies of positive feedback between the random feedback group and the effective feedback group. Because social feedback could provide a positive feeling (<xref ref-type="bibr" rid="ref22">Ho et al., 2019</xref>), a higher ratio of positive feedback in the random group may lead to stronger positive feelings among participants in that group than in the effective feedback group. Thirdly, the feedback, whether in the random or effective group, is pseudo-social and constant throughout the experiment, potentially limiting its credibility. Further studies could use models to establish the behavior pattern of feedback that simulates real feedback, or explore the real two-person task scenario to update parameters within a one-person computational model. Fourthly, the sex ratio of the participants was unbalanced, with more women than men, thus it was not possible to investigate whether gender had an effect on learning differences. Lastly, this study investigated the impact of peer feedback in terms of behavioral performance and computational model parameters, without considering the influence of individual subjective feelings and individual differences. 
Future experiments should therefore include the measurement of subjective feelings such as subjective engagement and trust in peers, as well as individual characteristics.</p>
</sec>
<sec sec-type="data-availability" id="sec12">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="ethics-statement" id="sec13">
<title>Ethics statement</title>
<p>The studies involving humans were approved by Central China Normal University, Ethic Committee, EC, Institutional Review Board. The studies were conducted in accordance with the local legislation and institutional requirements. The participants provided their written informed consent to participate in this study.</p>
</sec>
<sec sec-type="author-contributions" id="sec14">
<title>Author contributions</title>
<p>MP: Conceptualization, Writing &#x2013; review &#x0026; editing, Methodology, Project administration, Resources, Supervision, Validation, Writing &#x2013; original draft. QD: Formal analysis, Methodology, Software, Writing &#x2013; original draft. XY: Methodology, Project administration, Writing &#x2013; original draft. RT: Methodology, Project administration, Writing &#x2013; original draft. LZ: Supervision, Writing &#x2013; review &#x0026; editing. HZ: Supervision, Writing &#x2013; review &#x0026; editing. XL: Writing &#x2013; review &#x0026; editing.</p>
</sec>
</body>
<back>
<sec sec-type="funding-information" id="sec15">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<sec sec-type="COI-statement" id="sec16">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="sec17">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fpsyg.2024.1292808/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fpsyg.2024.1292808/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.DOCX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agay</surname> <given-names>N.</given-names></name> <name><surname>Yechiam</surname> <given-names>E.</given-names></name> <name><surname>Carmel</surname> <given-names>Z.</given-names></name> <name><surname>Levkovitz</surname> <given-names>Y.</given-names></name></person-group> (<year>2010</year>). <article-title>Non-specific effects of methylphenidate (Ritalin) on cognitive ability and decision-making of ADHD and healthy adults</article-title>. <source>Psychopharmacology</source> <volume>210</volume>, <fpage>511</fpage>&#x2013;<lpage>519</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00213-010-1853-4</pub-id>, PMID: <pub-id pub-id-type="pmid">20424828</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ahn</surname> <given-names>W.-Y.</given-names></name> <name><surname>Busemeyer</surname> <given-names>J. R.</given-names></name> <name><surname>Wagenmakers</surname> <given-names>E.-J.</given-names></name> <name><surname>Stout</surname> <given-names>J. C.</given-names></name></person-group> (<year>2008</year>). <article-title>Comparison of decision learning models using the generalization criterion method</article-title>. <source>Cogn. Sci.</source> <volume>32</volume>, <fpage>1376</fpage>&#x2013;<lpage>1402</lpage>. doi: <pub-id pub-id-type="doi">10.1080/03640210802352992</pub-id>, PMID: <pub-id pub-id-type="pmid">21585458</pub-id></citation></ref>
<ref id="ref9003"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ahn</surname> <given-names>W.-Y.</given-names></name> <name><surname>Haines</surname> <given-names>N.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name></person-group> (<year>2017</year>). <article-title>Revealing Neurocomputational Mechanisms of Reinforcement Learning and Decision-Making With the hBayesDM Package</article-title>. <source>Computational Psychiatry</source> <volume>1</volume>, <fpage>24</fpage>&#x2013;<lpage>57</lpage>. doi: <pub-id pub-id-type="doi">10.1162/CPSY_a_00002</pub-id>, PMID: <pub-id pub-id-type="pmid">29601060</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ahn</surname> <given-names>W.-Y.</given-names></name> <name><surname>Vasilev</surname> <given-names>G.</given-names></name> <name><surname>Lee</surname> <given-names>S.-H.</given-names></name> <name><surname>Busemeyer</surname> <given-names>J. R.</given-names></name> <name><surname>Kruschke</surname> <given-names>J. K.</given-names></name> <name><surname>Bechara</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Decision-making in stimulant and opiate addicts in protracted abstinence: evidence from computational modeling with pure users</article-title>. <source>Front. Psychol.</source> <volume>5</volume>:<fpage>849</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2014.00849</pub-id>, PMID: <pub-id pub-id-type="pmid">25161631</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bechara</surname> <given-names>A.</given-names></name> <name><surname>Damasio</surname> <given-names>A. R.</given-names></name> <name><surname>Damasio</surname> <given-names>H.</given-names></name> <name><surname>Anderson</surname> <given-names>S. W.</given-names></name></person-group> (<year>1994</year>). <article-title>Insensitivity to future consequences following damage to human prefrontal cortex</article-title>. <source>Cognition</source> <volume>50</volume>, <fpage>7</fpage>&#x2013;<lpage>15</lpage>. doi: <pub-id pub-id-type="doi">10.1016/0010-0277(94)90018-3</pub-id>, PMID: <pub-id pub-id-type="pmid">8039375</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Case</surname> <given-names>J. A. C.</given-names></name> <name><surname>Olino</surname> <given-names>T. M.</given-names></name></person-group> (<year>2020</year>). <article-title>Approach and avoidance patterns in reward learning across domains: an initial examination of the social Iowa gambling task</article-title>. <source>Behav. Res. Ther.</source> <volume>125</volume>:<fpage>103547</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.brat.2019.103547</pub-id>, PMID: <pub-id pub-id-type="pmid">31954996</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cassotti</surname> <given-names>M.</given-names></name> <name><surname>A&#x00EF;te</surname> <given-names>A.</given-names></name> <name><surname>Osmont</surname> <given-names>A.</given-names></name> <name><surname>Houd&#x00E9;</surname> <given-names>O.</given-names></name> <name><surname>Borst</surname> <given-names>G.</given-names></name></person-group> (<year>2014</year>). <article-title>What have we learned about the processes involved in the Iowa gambling task from developmental studies?</article-title> <source>Front. Psychol.</source> <volume>5</volume>:<fpage>915</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2014.00915</pub-id>, PMID: <pub-id pub-id-type="pmid">25191295</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cauffman</surname> <given-names>E.</given-names></name> <name><surname>Shulman</surname> <given-names>E. P.</given-names></name> <name><surname>Steinberg</surname> <given-names>L.</given-names></name> <name><surname>Claus</surname> <given-names>E.</given-names></name> <name><surname>Banich</surname> <given-names>M. T.</given-names></name> <name><surname>Graham</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Age differences in affective decision making as indexed by performance on the Iowa gambling task</article-title>. <source>Dev. Psychol.</source> <volume>46</volume>, <fpage>193</fpage>&#x2013;<lpage>207</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0016128</pub-id>, PMID: <pub-id pub-id-type="pmid">20053017</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Charpentier</surname> <given-names>C. J.</given-names></name> <name><surname>Iigaya</surname> <given-names>K.</given-names></name> <name><surname>O&#x2019;Doherty</surname> <given-names>J. P.</given-names></name></person-group> (<year>2020</year>). <article-title>A neuro-computational account of arbitration between choice imitation and goal emulation during human observational learning</article-title>. <source>Neuron</source> <volume>106</volume>, <fpage>687</fpage>&#x2013;<lpage>699.e7</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2020.02.028</pub-id>, PMID: <pub-id pub-id-type="pmid">32187528</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Colombo</surname> <given-names>M.</given-names></name> <name><surname>Stankevicius</surname> <given-names>A.</given-names></name> <name><surname>Series</surname> <given-names>P.</given-names></name></person-group> (<year>2014</year>). <article-title>Benefits of social vs. non-social feedback on learning and generosity. Results from the tipping game</article-title>. <source>Front. Psychol.</source> <volume>5</volume>:<fpage>1154</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2014.01154</pub-id>, PMID: <pub-id pub-id-type="pmid">25346715</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cutler</surname> <given-names>J.</given-names></name> <name><surname>Wittmann</surname> <given-names>M. K.</given-names></name> <name><surname>Abdurahman</surname> <given-names>A.</given-names></name> <name><surname>Hargitai</surname> <given-names>L. D.</given-names></name> <name><surname>Drew</surname> <given-names>D.</given-names></name> <name><surname>Husain</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Ageing is associated with disrupted reinforcement learning whilst learning to help others is preserved</article-title>. <source>Nat. Commun.</source> <volume>12</volume>:<fpage>4440</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41467-021-24576-w</pub-id>, PMID: <pub-id pub-id-type="pmid">34290236</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Houwer</surname> <given-names>J.</given-names></name> <name><surname>Barnes-Holmes</surname> <given-names>D.</given-names></name> <name><surname>Moors</surname> <given-names>A.</given-names></name></person-group> (<year>2013</year>). <article-title>What is learning? On the nature and merits of a functional definition of learning</article-title>. <source>Psychon. Bull. Rev.</source> <volume>20</volume>, <fpage>631</fpage>&#x2013;<lpage>642</lpage>. doi: <pub-id pub-id-type="doi">10.3758/s13423-013-0386-3</pub-id>, PMID: <pub-id pub-id-type="pmid">23359420</pub-id></citation></ref>
<ref id="ref13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Faul</surname> <given-names>F.</given-names></name> <name><surname>Erdfelder</surname> <given-names>E.</given-names></name> <name><surname>Lang</surname> <given-names>A.-G.</given-names></name> <name><surname>Buchner</surname> <given-names>A.</given-names></name></person-group> (<year>2007</year>). <article-title>G&#x002A;power 3: a flexible statistical power analysis program for the social, behavioral, and biomedical sciences</article-title>. <source>Behav. Res. Methods</source> <volume>39</volume>, <fpage>175</fpage>&#x2013;<lpage>191</lpage>. doi: <pub-id pub-id-type="doi">10.3758/BF03193146</pub-id>, PMID: <pub-id pub-id-type="pmid">17695343</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garon</surname> <given-names>N. M.</given-names></name> <name><surname>English</surname> <given-names>S. D.</given-names></name></person-group> (<year>2021</year>). <article-title>Heterogeneity of decision-making strategies for preschoolers on a variant of the IGT</article-title>. <source>Appl. Neuropsychol. Child</source> <volume>11</volume>, <fpage>811</fpage>&#x2013;<lpage>824</lpage>. doi: <pub-id pub-id-type="doi">10.1080/21622965.2021.1973470</pub-id>, PMID: <pub-id pub-id-type="pmid">34505556</pub-id></citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gweon</surname> <given-names>H.</given-names></name></person-group> (<year>2021</year>). <article-title>Inferential social learning: cognitive foundations of human social learning and teaching</article-title>. <source>Trends Cogn. Sci.</source> <volume>25</volume>, <fpage>896</fpage>&#x2013;<lpage>910</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tics.2021.07.008</pub-id>, PMID: <pub-id pub-id-type="pmid">34417094</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haines</surname> <given-names>N.</given-names></name> <name><surname>Vassileva</surname> <given-names>J.</given-names></name> <name><surname>Ahn</surname> <given-names>W.</given-names></name></person-group> (<year>2018</year>). <article-title>The outcome-representation learning model: a novel reinforcement learning model of the Iowa gambling task</article-title>. <source>Cogn. Sci.</source> <volume>42</volume>, <fpage>2534</fpage>&#x2013;<lpage>2561</lpage>. doi: <pub-id pub-id-type="doi">10.1111/cogs.12688</pub-id>, PMID: <pub-id pub-id-type="pmid">30289167</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>P. L.</given-names></name></person-group> (<year>2012</year>). &#x201C;<article-title>Trusting what You&#x2019;re told: how children learn from others</article-title>&#x201D; in <source>Trusting what You&#x2019;re told</source> (<publisher-name>Harvard University Press</publisher-name>).</citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hayes</surname> <given-names>W. M.</given-names></name> <name><surname>Wedell</surname> <given-names>D. H.</given-names></name></person-group> (<year>2020a</year>). <article-title>Autonomic responses to choice outcomes: links to task performance and reinforcement-learning parameters</article-title>. <source>Biol. Psychol.</source> <volume>156</volume>:<fpage>107968</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.biopsycho.2020.107968</pub-id>, PMID: <pub-id pub-id-type="pmid">33027684</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hayes</surname> <given-names>W. M.</given-names></name> <name><surname>Wedell</surname> <given-names>D. H.</given-names></name></person-group> (<year>2020b</year>). <article-title>Modeling the role of feelings in the Iowa gambling task</article-title>. <source>Decision</source> <volume>7</volume>, <fpage>67</fpage>&#x2013;<lpage>89</lpage>. doi: <pub-id pub-id-type="doi">10.1037/dec0000116</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hertz</surname> <given-names>U.</given-names></name> <name><surname>Bell</surname> <given-names>V.</given-names></name> <name><surname>Raihani</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <article-title>Trusting and learning from others: immediate and long-term effects of learning from observation and advice</article-title>. <source>Proc. R. Soc. B Biol. Sci.</source> <volume>288</volume>:<fpage>20211414</fpage>. doi: <pub-id pub-id-type="doi">10.1098/rspb.2021.1414</pub-id>, PMID: <pub-id pub-id-type="pmid">34666522</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Heyes</surname> <given-names>C.</given-names></name></person-group> (<year>2012</year>). <article-title>What&#x2019;s social about social learning?</article-title> <source>J. Comp. Psychol.</source> <volume>126</volume>, <fpage>193</fpage>&#x2013;<lpage>202</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0025180</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ho</surname> <given-names>M. K.</given-names></name> <name><surname>Cushman</surname> <given-names>F.</given-names></name> <name><surname>Littman</surname> <given-names>M. L.</given-names></name> <name><surname>Austerweil</surname> <given-names>J. L.</given-names></name></person-group> (<year>2019</year>). <article-title>People teach with rewards and punishments as communication, not reinforcements</article-title>. <source>J. Exp. Psychol. Gen.</source> <volume>148</volume>, <fpage>520</fpage>&#x2013;<lpage>549</lpage>. doi: <pub-id pub-id-type="doi">10.1037/xge0000569</pub-id>, PMID: <pub-id pub-id-type="pmid">30802127</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ho</surname> <given-names>M. K.</given-names></name> <name><surname>MacGlashan</surname> <given-names>J.</given-names></name> <name><surname>Littman</surname> <given-names>M. L.</given-names></name> <name><surname>Cushman</surname> <given-names>F.</given-names></name></person-group> (<year>2017</year>). <article-title>Social is special: a normative framework for teaching with and learning from evaluative feedback</article-title>. <source>Cognition</source> <volume>167</volume>, <fpage>91</fpage>&#x2013;<lpage>106</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cognition.2017.03.006</pub-id>, PMID: <pub-id pub-id-type="pmid">28341268</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hofmans</surname> <given-names>L.</given-names></name> <name><surname>van den Bos</surname> <given-names>W.</given-names></name></person-group> (<year>2022</year>). <article-title>Social learning across adolescence: a Bayesian neurocognitive perspective</article-title>. <source>Dev. Cogn. Neurosci.</source> <volume>58</volume>:<fpage>101151</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.dcn.2022.101151</pub-id>, PMID: <pub-id pub-id-type="pmid">36183664</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Izuma</surname> <given-names>K.</given-names></name> <name><surname>Saito</surname> <given-names>D. N.</given-names></name> <name><surname>Sadato</surname> <given-names>N.</given-names></name></person-group> (<year>2008</year>). <article-title>Processing of social and monetary rewards in the human striatum</article-title>. <source>Neuron</source> <volume>58</volume>, <fpage>284</fpage>&#x2013;<lpage>294</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.neuron.2008.03.020</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kendal</surname> <given-names>R. L.</given-names></name> <name><surname>Boogert</surname> <given-names>N. J.</given-names></name> <name><surname>Rendell</surname> <given-names>L.</given-names></name> <name><surname>Laland</surname> <given-names>K. N.</given-names></name> <name><surname>Webster</surname> <given-names>M.</given-names></name> <name><surname>Jones</surname> <given-names>P. L.</given-names></name></person-group> (<year>2018</year>). <article-title>Social learning strategies: bridge-building between fields</article-title>. <source>Trends Cogn. Sci.</source> <volume>22</volume>, <fpage>651</fpage>&#x2013;<lpage>665</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tics.2018.04.003</pub-id>, PMID: <pub-id pub-id-type="pmid">29759889</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laland</surname> <given-names>K. N.</given-names></name></person-group> (<year>2004</year>). <article-title>Social learning strategies</article-title>. <source>Anim. Learn. Behav.</source> <volume>32</volume>, <fpage>4</fpage>&#x2013;<lpage>14</lpage>. doi: <pub-id pub-id-type="doi">10.3758/BF03196002</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>A.</given-names></name> <name><surname>Adolphs</surname> <given-names>R.</given-names></name> <name><surname>Rangel</surname> <given-names>A.</given-names></name></person-group> (<year>2012</year>). <article-title>Social and monetary reward learning engage overlapping neural substrates</article-title>. <source>Soc. Cogn. Affect. Neurosci.</source> <volume>7</volume>, <fpage>274</fpage>&#x2013;<lpage>281</lpage>. doi: <pub-id pub-id-type="doi">10.1093/scan/nsr006</pub-id>, PMID: <pub-id pub-id-type="pmid">21427193</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mukherjee</surname> <given-names>D.</given-names></name> <name><surname>Kable</surname> <given-names>J. W.</given-names></name></person-group> (<year>2014</year>). <article-title>Value-based decision making in mental illness: a meta-analysis</article-title>. <source>Clin. Psychol. Sci.</source> <volume>2</volume>, <fpage>767</fpage>&#x2013;<lpage>782</lpage>. doi: <pub-id pub-id-type="doi">10.1177/2167702614531580</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Must</surname> <given-names>A.</given-names></name> <name><surname>Szab&#x00F3;</surname> <given-names>Z.</given-names></name> <name><surname>B&#x00F3;di</surname> <given-names>N.</given-names></name> <name><surname>Sz&#x00E1;sz</surname> <given-names>A.</given-names></name> <name><surname>Janka</surname> <given-names>Z.</given-names></name> <name><surname>K&#x00E9;ri</surname> <given-names>S.</given-names></name></person-group> (<year>2006</year>). <article-title>Sensitivity to reward and punishment and the prefrontal cortex in major depression</article-title>. <source>J. Affect. Disord.</source> <volume>90</volume>, <fpage>209</fpage>&#x2013;<lpage>215</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jad.2005.12.005</pub-id>, PMID: <pub-id pub-id-type="pmid">16412520</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Namba</surname> <given-names>S.</given-names></name></person-group> (<year>2021</year>). <article-title>Feedback from facial expressions contribute to slow learning rate in an Iowa gambling task</article-title>. <source>Front. Psychol.</source> <volume>12</volume>:<fpage>684249</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fpsyg.2021.684249</pub-id>, PMID: <pub-id pub-id-type="pmid">34434141</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olsson</surname> <given-names>A.</given-names></name> <name><surname>Knapska</surname> <given-names>E.</given-names></name> <name><surname>Lindstr&#x00F6;m</surname> <given-names>B.</given-names></name></person-group> (<year>2020</year>). <article-title>The neural and computational systems of social learning</article-title>. <source>Nat. Rev. Neurosci.</source> <volume>21</volume>, <fpage>197</fpage>&#x2013;<lpage>212</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41583-020-0276-4</pub-id>, PMID: <pub-id pub-id-type="pmid">32221497</pub-id></citation></ref>
<ref id="ref9001"><citation citation-type="book"><person-group person-group-type="author"><name><surname>Rescorla</surname> <given-names>R.</given-names></name> <name><surname>Wagner</surname> <given-names>A.</given-names></name></person-group> (<year>1972</year>). &#x201C;<article-title>A theory of Pavlovian conditioning: Variations in the effectiveness of reinforcement and nonreinforcement</article-title>&#x201D; in <source>Classical Conditioning II: Current Research and Theory</source>, <fpage>64</fpage>&#x2013;<lpage>99</lpage>.</citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schindler</surname> <given-names>S.</given-names></name> <name><surname>Vormbrock</surname> <given-names>R.</given-names></name> <name><surname>Kissler</surname> <given-names>J.</given-names></name></person-group> (<year>2022</year>). <article-title>Encoding in a social feedback context enhances and biases behavioral and electrophysiological correlates of long-term recognition memory</article-title>. <source>Sci. Rep.</source> <volume>12</volume>:<fpage>3312</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-022-07270-9</pub-id>, PMID: <pub-id pub-id-type="pmid">35228604</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Serrano</surname> <given-names>J. I.</given-names></name> <name><surname>Iglesias</surname> <given-names>&#x00C1;.</given-names></name> <name><surname>Woods</surname> <given-names>S. P.</given-names></name> <name><surname>del Castillo</surname> <given-names>M. D.</given-names></name></person-group> (<year>2022</year>). <article-title>A computational cognitive model of the Iowa gambling task for finely characterizing decision making in methamphetamine users</article-title>. <source>Expert Syst. Appl.</source> <volume>205</volume>:<fpage>117795</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.eswa.2022.117795</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Steingroever</surname> <given-names>H.</given-names></name> <name><surname>Wetzels</surname> <given-names>R.</given-names></name> <name><surname>Horstmann</surname> <given-names>A.</given-names></name> <name><surname>Neumann</surname> <given-names>J.</given-names></name> <name><surname>Wagenmakers</surname> <given-names>E.-J.</given-names></name></person-group> (<year>2012</year>). <article-title>Performance of healthy participants on the Iowa gambling task</article-title>. <source>Psychol. Assess.</source> <volume>25</volume>, <fpage>180</fpage>&#x2013;<lpage>193</lpage>. doi: <pub-id pub-id-type="doi">10.1037/a0029929</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Thompson</surname> <given-names>J.</given-names></name> <name><surname>Westwater</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Alpha EEG power reflects the suppression of Pavlovian bias during social reinforcement learning</article-title>. <comment>bioRxiv</comment>. doi: <pub-id pub-id-type="doi">10.1101/153668</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van der Borght</surname> <given-names>L.</given-names></name> <name><surname>Schouppe</surname> <given-names>N.</given-names></name> <name><surname>Notebaert</surname> <given-names>W.</given-names></name></person-group> (<year>2016</year>). <article-title>Improved memory for error feedback</article-title>. <source>Psychol. Res.</source> <volume>80</volume>, <fpage>1049</fpage>&#x2013;<lpage>1058</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00426-015-0705-6</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>V&#x00E9;lez</surname> <given-names>N.</given-names></name> <name><surname>Gweon</surname> <given-names>H.</given-names></name></person-group> (<year>2021</year>). <article-title>Learning from other minds: an optimistic critique of reinforcement learning models of social learning</article-title>. <source>Curr. Opin. Behav. Sci.</source> <volume>38</volume>, <fpage>110</fpage>&#x2013;<lpage>115</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cobeha.2021.01.006</pub-id>, PMID: <pub-id pub-id-type="pmid">35321420</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Westhoff</surname> <given-names>B.</given-names></name> <name><surname>Blankenstein</surname> <given-names>N. E.</given-names></name> <name><surname>Schreuders</surname> <given-names>E.</given-names></name> <name><surname>Crone</surname> <given-names>E. A.</given-names></name> <name><surname>van Duijvenvoorde</surname> <given-names>A. C. K.</given-names></name></person-group> (<year>2021</year>). <article-title>Increased ventromedial prefrontal cortex activity in adolescence benefits prosocial reinforcement learning</article-title>. <source>Dev. Cogn. Neurosci.</source> <volume>52</volume>:<fpage>101018</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.dcn.2021.101018</pub-id>, PMID: <pub-id pub-id-type="pmid">34678671</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Gl&#x00E4;scher</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>A brain network supporting social influences in human decision-making</article-title>. <source>Sci. Adv.</source> <volume>6</volume>:<fpage>eabb4159</fpage>. doi: <pub-id pub-id-type="doi">10.1126/sciadv.abb4159</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Moisan</surname> <given-names>F.</given-names></name> <name><surname>Aggarwal</surname> <given-names>P.</given-names></name> <name><surname>Gonzalez</surname> <given-names>C.</given-names></name></person-group> (<year>2022</year>). <article-title>Truth-telling in a sender&#x2013;receiver game: social value orientation and incentives</article-title>. <source>Symmetry</source> <volume>14</volume>:<fpage>1561</fpage>. doi: <pub-id pub-id-type="doi">10.3390/sym14081561</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Lengersdorff</surname> <given-names>L.</given-names></name> <name><surname>Mikus</surname> <given-names>N.</given-names></name> <name><surname>Gl&#x00E4;scher</surname> <given-names>J.</given-names></name> <name><surname>Lamm</surname> <given-names>C.</given-names></name></person-group> (<year>2020</year>). <article-title>Using reinforcement learning models in social neuroscience: frameworks, pitfalls and suggestions of best practices</article-title>. <source>Soc. Cogn. Affect. Neurosci.</source> <volume>15</volume>, <fpage>695</fpage>&#x2013;<lpage>707</lpage>. doi: <pub-id pub-id-type="doi">10.1093/scan/nsaa089</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>T.</given-names></name> <name><surname>Cheng</surname> <given-names>T.</given-names></name> <name><surname>Chen</surname> <given-names>C.</given-names></name> <name><surname>Zhai</surname> <given-names>Y.</given-names></name> <name><surname>Liang</surname> <given-names>X.</given-names></name> <etal/></person-group>. (<year>2023</year>). <article-title>Neurocomputational mechanisms of young children&#x2019;s observational learning of delayed gratification</article-title>. <source>Cereb. Cortex</source> <volume>33</volume>, <fpage>6063</fpage>&#x2013;<lpage>6076</lpage>. doi: <pub-id pub-id-type="doi">10.1093/cercor/bhac484</pub-id>, PMID: <pub-id pub-id-type="pmid">36562999</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zonca</surname> <given-names>J.</given-names></name> <name><surname>Vostroknutov</surname> <given-names>A.</given-names></name> <name><surname>Coricelli</surname> <given-names>G.</given-names></name> <name><surname>Polonio</surname> <given-names>L.</given-names></name></person-group> (<year>2021</year>). <article-title>Timing of social feedback shapes observational learning in strategic interaction</article-title>. <source>Sci. Rep.</source> <volume>11</volume>:<fpage>21972</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-021-01466-1</pub-id>, PMID: <pub-id pub-id-type="pmid">34754038</pub-id></citation></ref>
</ref-list>
</back>
</article>