<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JSG</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Serious Games</journal-id>
      <journal-title>JMIR Serious Games</journal-title>
      <issn pub-type="epub">2291-9279</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i4e41097</article-id>
      <article-id pub-id-type="pmid">36480248</article-id>
      <article-id pub-id-type="doi">10.2196/41097</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>An Automated Virtual Reality Training System for Teacher-Student Interaction: A Randomized Controlled Trial</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Zary</surname>
            <given-names>Nabil</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>See</surname>
            <given-names>Christopher</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>King</surname>
            <given-names>Seth</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Teaching and Learning</institution>
            <institution>College of Education</institution>
            <institution>University of Iowa</institution>
            <addr-line>240 S. Madison St.</addr-line>
            <addr-line>Iowa City, IA, 52242</addr-line>
            <country>United States</country>
            <phone>1 828 448 0950</phone>
            <email>sakng@uiowa.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-7142-8694</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Boyer</surname>
            <given-names>Joseph</given-names>
          </name>
          <degrees>MA</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0537-3522</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Bell</surname>
            <given-names>Tyler</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2205-7310</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Estapa</surname>
            <given-names>Anne</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9810-0821</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Teaching and Learning</institution>
        <institution>College of Education</institution>
        <institution>University of Iowa</institution>
        <addr-line>Iowa City, IA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Electrical and Computer Engineering</institution>
        <institution>College of Engineering</institution>
        <institution>University of Iowa</institution>
        <addr-line>Iowa City, IA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Seth King <email>sakng@uiowa.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Oct-Dec</season>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>8</day>
        <month>12</month>
        <year>2022</year>
      </pub-date>
      <volume>10</volume>
      <issue>4</issue>
      <elocation-id>e41097</elocation-id>
      <history>
        <date date-type="received">
          <day>28</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>7</day>
          <month>9</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>18</day>
          <month>9</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>2</day>
          <month>11</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Seth King, Joseph Boyer, Tyler Bell, Anne Estapa. Originally published in JMIR Serious Games (https://games.jmir.org), 08.12.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Serious Games, is properly cited. The complete bibliographic information, a link to the original publication on https://games.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://games.jmir.org/2022/4/e41097" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Shortages in qualified supervision and other resources prevent education personnel from rehearsing effective practices. Interactive simulations, although increasingly used in education, frequently require instructor management. Automated simulations rarely engage trainees in skills related to practice (eg, speech).</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We evaluated the capability of delivering behavioral skills training through an automated virtual reality (VR) simulation using artificial intelligence to improve the implementation of a nondirective mathematical questioning strategy.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We recruited and randomly assigned 30 college-aged participants to equivalent treatment (ie, lecture, modeling, and VR; 15/30, 50%) and control groups (ie, lecture and modeling only; 15/30, 50%). The participants were blind to treatment conditions. Sessions and assessments were conducted face to face and involved the use of VR for assessment regardless of the condition. Lessons concerned the use of a nondirective mathematical questioning strategy in instances where a simulated student provided correct or incorrect answers to word problems. The measures included observed and automated assessments of participant performance and subjective assessments of participant confidence. The participants completed the pretest, posttest, and maintenance probes each week over the course of 3 weeks.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A mixed ANOVA revealed significant main effects of time (<italic>F</italic><sub>2,27</sub>=124.154; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.816) and treatment (<italic>F</italic><sub>1,28</sub>=19.281; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.408) as well as an interaction effect (<italic>F</italic><sub>2,28</sub>=8.429; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.231) for the average percentage of steps in the questioning procedure. Posttest scores for the intervention group (mean 88%, SD 22.62%) exceeded those of the control group (mean 63.33%, SD 22.64%), with <italic>t</italic><sub>28</sub>=3.653, <italic>P</italic>&#60;.001, and Cohen <italic>d</italic>=1.334. Maintenance scores indicated a positive effect of the intervention (mean 83.33%, SD 24.40%) relative to the control (mean 54.67%, SD 15.98%), <italic>t</italic><sub>28</sub>=3.807, <italic>P</italic>&#60;.001, Cohen <italic>d</italic>=1.39. A Mann-Whitney <italic>U</italic> test indicated that the treatment group’s self-ratings of confidence (mean 2.41, SD 0.51) were higher than those of the control group (mean 2.04, SD 0.52), <italic>U</italic>=64, <italic>P</italic>=.04, <italic>r</italic>=0.137.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The results demonstrate the potential of artificial intelligence-augmented VR to deliver effective, evidence-based training with limited instructor management. Additional work is needed to demonstrate the cascading effect of training on authentic practice and to encompass a wider range of skills.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>virtual reality</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>behavioral skills training</kwd>
        <kwd>education</kwd>
        <kwd>professional development</kwd>
        <kwd>staff training</kwd>
        <kwd>mathematics</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>High-quality professional development contributes to the effectiveness of education personnel [<xref ref-type="bibr" rid="ref1">1</xref>] and success of their students [<xref ref-type="bibr" rid="ref2">2</xref>]. However, the training education professionals receive before entering the field often consists of lectures [<xref ref-type="bibr" rid="ref3">3</xref>] with few opportunities to practice skills or receive performance feedback—key aspects of effective professional development [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Training ideally provides multiple opportunities for practice across a range of unpredictable situations under the supervision of a competent observer [<xref ref-type="bibr" rid="ref7">7</xref>]. The prevalence of less effective approaches to professional development stems from a shortage of qualified supervisors and suitable practicum placements in many areas [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref8">8</xref>]. The difficulty in providing effective training for education personnel has perpetuated the use of ineffective practices in education [<xref ref-type="bibr" rid="ref9">9</xref>].</p>
        <p>Head-mounted virtual reality (VR), using an array of visual, auditory, and tactile interfaces that adjusts the display based on user sensorimotor inputs to fully immerse participants within a simulation [<xref ref-type="bibr" rid="ref10">10</xref>], is increasingly associated with improved learner outcomes, increased engagement, and the ability to repeatedly practice skills [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. The immersion permitted by VR potentially allows educators to engage in behaviors and interact with stimuli closely aligned with actual practice, which can improve the administration of instruction and increase teacher confidence [<xref ref-type="bibr" rid="ref13">13</xref>]. The maximum immersion permitted through VR may not be necessary in all scenarios (eg, conversation); however, VR allows for a realistic representation of nonverbal communication that accompanies speech as well as any potential physical interactions. In addition, <italic>removing</italic> components from a fully immersive simulation to place core content on platforms such as desktops is technically easier than <italic>adding</italic> critical immersive elements to simulations developed on less-sophisticated devices [<xref ref-type="bibr" rid="ref14">14</xref>]. VR applications can be adapted to preserve their core functionality across a range of devices, thus making development on the platform potentially conducive to dissemination.</p>
        <p>The technology associated with VR has become more affordable [<xref ref-type="bibr" rid="ref15">15</xref>]; however, it is most frequently used as a training tool in medicine [<xref ref-type="bibr" rid="ref16">16</xref>]. The results of VR simulations tested in the educational context are mixed, with early reports of limited effectiveness and induced illness [<xref ref-type="bibr" rid="ref15">15</xref>] being contradicted only by recent research with more positive findings [<xref ref-type="bibr" rid="ref17">17</xref>]. VR simulations specific to teacher education typically require trainees to observe events depicted in 3D space (eg, bullying behavior and self-injury) rather than interact [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. VR simulations targeting human interaction are typically controlled directly by expert trainers; at a minimum, human observers must administer assessments [<xref ref-type="bibr" rid="ref13">13</xref>]. Experiments involving the performance of complex procedures (eg, functional communication training [<xref ref-type="bibr" rid="ref19">19</xref>]), although they include scripts to simulate the behavior of student avatars, rely on researchers to assess trainees.</p>
        <p>Although absent from studies of teacher training, artificial intelligence (AI)—or software capable of independently acquiring, processing, and acting upon information [<xref ref-type="bibr" rid="ref20">20</xref>]—is emerging as a force in education through the growing implementation of chatbots, automated assessment, facial recognition, and other functions to support teaching and learning [<xref ref-type="bibr" rid="ref21">21</xref>]. AI relies on machine learning (eg, natural language processing) in which computers are trained to classify new stimuli following exposure to previous data sets (ie, training data) and statistical models to make predictions based on new information [<xref ref-type="bibr" rid="ref22">22</xref>]. Intelligent tutoring systems, which provide individualized instruction based on the responses and characteristics of learners, encompass many AI functions relevant to education, including learner assessment, content generation, and providing feedback [<xref ref-type="bibr" rid="ref23">23</xref>]. An increasing number of programs targeting specific academic skills in K-12 and higher education have recently emerged [<xref ref-type="bibr" rid="ref22">22</xref>], such as the IBM Watson Tutor, a dialogue-based tutor that uses natural language processing to interpret learners’ comments and provide appropriate feedback [<xref ref-type="bibr" rid="ref24">24</xref>]. However, studies integrating VR and AI are currently limited [<xref ref-type="bibr" rid="ref22">22</xref>]. Existing applications incorporating AI, such as Lamb and Etopio’s classroom management scenarios [<xref ref-type="bibr" rid="ref25">25</xref>], allow for participant interaction with student avatars but do not assess the implementation of discrete instructional practices.</p>
        <p>A recent experiment [<xref ref-type="bibr" rid="ref14">14</xref>] demonstrated the effectiveness of an automated VR simulation capable of administering instructional procedures and assessing learner performance on the use of a mathematical questioning procedure. Evidence suggests that nondirective mathematical questioning, in which students’ thought processes are elicited before confirming whether an answer is correct, can improve student outcomes [<xref ref-type="bibr" rid="ref26">26</xref>]. Effective questions require students to assess, explain, and justify their answers [<xref ref-type="bibr" rid="ref27">27</xref>]. This process facilitates instructional decisions, especially when teachers cannot observe the problem-solving process or the correct answer may be derived through an inefficient or inappropriate approach [<xref ref-type="bibr" rid="ref28">28</xref>]. Interaction-focused techniques such as mathematical questioning, which involves the assessment of speech rather than simple movements or button presses, differ from the content generally addressed in VR training simulations.</p>
        <p>The training developed by King et al [<xref ref-type="bibr" rid="ref14">14</xref>] consisted of video-recorded lectures and simulations capable of providing automatic assessment, textual prompting, and feedback through the incorporation of VR and AI (eg, speech classification and speech-to-text). As in the research conducted by Clay et al [<xref ref-type="bibr" rid="ref19">19</xref>], the components of the intervention were arranged in accordance with behavioral skills training (BST), an evidence-based approach to personnel preparation encompassing a range of instructional components, including didactic instruction, modeling, rehearsal, and feedback [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Textual onscreen prompts, systematic prompting, and video models were incorporated based on evidence of their effectiveness in the literature [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. The use of a single-case design [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>] permitted improvements in simulation functionality over the course of the experiment, resulting in automated assessments with a high degree of agreement with direct observation (&#62;96%) and large changes in the percentage of steps in the procedure exhibited by the two participating trainees after 3 consecutive days of training (Tau<sub>bc</sub>=0.80 [<xref ref-type="bibr" rid="ref37">37</xref>]).</p>
        <p>In contrast to many approaches to VR, which are not constructed in accordance with a specific learning theory [<xref ref-type="bibr" rid="ref38">38</xref>], the simulation developed by King et al [<xref ref-type="bibr" rid="ref14">14</xref>] was predicated on behavioral theories of learning and instruction [<xref ref-type="bibr" rid="ref39">39</xref>] that aim to encourage appropriate responses in the presence of specific antecedents (ie, discriminative stimuli), for example, praising a student for correctly answering a math problem. The ability of an antecedent to evoke the correct response can be increased and sustained through the introduction and gradual fading of prompts. Instructors may also administer consequences designed to increase correct responses, which can include providing stimuli of value to the learner (ie, positive reinforcement) or allowing the learner to avoid unpleasant stimuli (ie, negative reinforcement) [<xref ref-type="bibr" rid="ref39">39</xref>]. Prompts and consequences are most effective when provided immediately. In King et al [<xref ref-type="bibr" rid="ref14">14</xref>], the responses generated by simulated students represented antecedents associated with the correct steps of a procedure. The participants received textual prompts before they had an opportunity to respond. In addition, the simulation provided correctives immediately following incorrect responses and required the participants to provide a correct response. The avoidance of corrective procedures upon the use of correct responses in subsequent sessions and feedback regarding correct answers following each session provided negative and positive reinforcement, respectively. Notwithstanding this theoretical basis and the positive findings associated with the simulation, the small sample size and iterative development that occurred over the course of the experiment represent clear limitations.</p>
      </sec>
      <sec>
        <title>Purpose</title>
        <p>Given the scarce resources available for training, a simulation capable of independently providing assessment and instruction related to student-teacher interaction has the potential to benefit education personnel as well as their students and result in the wider dissemination of professional development. In light of the limitations of earlier work in this area [<xref ref-type="bibr" rid="ref14">14</xref>], this study assessed the ability of a feature-locked, AI-enhanced VR training application to independently impart the steps of a mathematical questioning strategy using a randomized controlled design. The guiding questions included the following: (1) Compared with individuals who did not receive training in VR, does the simulation improve the participants’ acquisition of steps in a mathematical questioning strategy? (2) To what extent does group performance differ during maintenance (ie, extended absence of instruction) and generalization (ie, untaught items) probes? (3) Does the VR simulation increase the participants’ perceived confidence in the use of the procedure, relative to the control group? (4) To what extent do the observed measures of trainee performance correspond with the automated measures?</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethics Approval</title>
        <p>The institutional review board at the University of Iowa approved all procedures and consent forms before recruitment (202112205).</p>
      </sec>
      <sec>
        <title>Participants and Setting</title>
        <p>Recruitment began in January 2022. The study was conducted throughout March and April 2022. Eligible participants were current and former graduate and undergraduate students affiliated with the University of Iowa. Potential participants were (1) aged &#62;18 years; (2) free of seizure disorders, epilepsy, or other health conditions potentially exacerbated by VR; and (3) able to use voice-activated assistants such as Alexa without accommodations. In addition, we excluded participants who were likely to be familiar with the subject material (ie, participants with employment experience in an educational setting or participants with records of completing courses in mathematics education) to ensure sufficient sensitivity to the intervention. A US $15 gift card was offered as an incentive for participation. For recruitment, the second author described the study to students in cooperating classrooms; the participants were also encouraged to share information regarding the study with potentially interested peers. In total, 30 individuals agreed to participate in this study. We assigned the participants to the experimental groups using a stratified randomization [<xref ref-type="bibr" rid="ref40">40</xref>] procedure based on observed mastery probes (OMPs) during the baseline phase. No attrition occurred over the course of the study. A survey of participant characteristics revealed no significant differences in familiarity with VR before the experiment. Additional demographic characteristics of the participants are shown in <xref ref-type="table" rid="table1">Table 1</xref>.</p>
        <p>Sessions and assessments were administered face to face in a small room with computer and internet access. Each participant’s sessions occurred once per week for 3 consecutive weeks. Scheduling ensured that approximately 7 days elapsed between the assessment sessions, which otherwise occurred at times acceptable to the participants. The participants were advised to terminate the sessions at the first sign of discomfort; however, all the sessions were completed without any incident. A master’s-level student in computer engineering (ie, the session administrator) conducted all the sessions with the participants individually.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Participant demographics.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="330"/>
            <col width="210"/>
            <col width="220"/>
            <col width="210"/>
            <thead>
              <tr valign="bottom">
                <td colspan="2">Participant</td>
                <td>Total (N=30)</td>
                <td>Control (n=15)</td>
                <td>VR<sup>a</sup> (n=15)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD); range</td>
                <td>22.13 (1.5); 19-26</td>
                <td>21.87 (1.81); 19-26</td>
                <td>22.4 (1.12); 21-25</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Sex<sup>b</sup>, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>16 (53)</td>
                <td>8 (53)</td>
                <td>8 (53)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>14 (47)</td>
                <td>7 (47)</td>
                <td>7 (47)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Academic program, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Business or finance</td>
                <td>8 (27)</td>
                <td>4 (27)</td>
                <td>4 (27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Engineering</td>
                <td>13 (43)</td>
                <td>6 (40)</td>
                <td>7 (47)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>9 (30)</td>
                <td>5 (33)</td>
                <td>4 (27)</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Educational status, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Undergraduate</td>
                <td>15 (50)</td>
                <td>9 (60)</td>
                <td>6 (40)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Master’s</td>
                <td>6 (20)</td>
                <td>2 (13)</td>
                <td>4 (27)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Doctoral</td>
                <td>2 (7)</td>
                <td>2 (13)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td>7 (23)</td>
                <td>2 (13)</td>
                <td>5 (33)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">VR experience<sup>c</sup>, mean (SD); range</td>
                <td>4.47 (1.74); 1-6</td>
                <td>4.47 (1.73); 1-6</td>
                <td>4.47 (1.81); 1-6</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>VR: virtual reality.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>None of the participants identified as being nonbinary.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>VR experience was determined using a 6-point Likert-type scale ranging from 1 (no experience) to 6 (much experience).</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Materials</title>
        <p>A commercially available Windows (Microsoft Corp) desktop computer facilitated video playback. We used the Oculus Quest 2 (Facebook Reality Labs; US $300) VR headset and its 2 controllers for all the instructional simulations. The Quest device has an integrated microphone and speakers and tracks motion without external sensors.</p>
      </sec>
      <sec>
        <title>Dependent Variables</title>
        <sec>
          <title>Overview</title>
          <p>This study examined 6 distinct dependent variables. The observed percentage of lesson steps completed correctly (ie, OMP) represented the principal outcome. To evaluate the simulation’s assessment capabilities, we compared the results of the OMPs with those of a virtual mastery probe (VMP) assessing the same skills. We obtained additional information regarding the perceptions of the participants from the SKIL Survey [<xref ref-type="bibr" rid="ref41">41</xref>].</p>
        </sec>
        <sec>
          <title>OMP Assessment</title>
          <p>For the OMPs, the session administrator collected information regarding the percentage of steps in the questioning procedure that the participants completed while interacting with the student avatar in the VR simulation. We calculated the results in terms of the total number of steps performed correctly divided by the total number of steps in procedures taught in lessons 1 and 2 combined (ie, 10 steps). The OMPs were created in relation to the content taught during training (ie, <italic>acquisition</italic> probes) to assess the participants across the baseline, posttest, and maintenance sessions as well as untaught content to assess the generalization of the procedure in posttest and maintenance sessions (ie, <italic>generalization</italic> probes). The steps in the acquisition probe are shown in <xref ref-type="table" rid="table2">Table 2</xref> (refer to “teacher steps”). We scored the OMPs in accordance with the single-opportunity method, in which the probe ended as soon as the participant exhibited an incorrect response [<xref ref-type="bibr" rid="ref42">42</xref>] because of (1) concerns regarding time commitment and (2) the chance of skill acquisition in the absence of instruction. Research suggests that single-opportunity method probes of chained tasks contribute relatively little bias [<xref ref-type="bibr" rid="ref42">42</xref>]. The participants did not receive feedback following the completion of the OMPs.</p>
          <table-wrap position="float" id="table2">
            <label>Table 2</label>
            <caption>
              <p>Steps in lessons 1 and 2 for teachers and simulated student.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="230"/>
              <col width="360"/>
              <col width="380"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Step</td>
                  <td>Description</td>
                  <td>Example and variations</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Lesson 1: responding to a correct answer</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1<sup>a</sup>: read the problem</td>
                  <td>The teacher reads the problem clearly and without errors</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“You have 5 fishbowls with 4 fish in each bowl. How many fish are there total?”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S1<sup>b</sup>: brief student correct answer</td>
                  <td>The student provides the correct answer without additional detail</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“There are 20 fish.”</p>
                      </list-item>
                      <list-item>
                        <p>“The answer is 20.”<sup>c</sup></p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2: unpack strategy request (correct)</td>
                  <td>After the student provides the correct answer, the teacher asks the student to explain</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“How did you solve this problem?”</p>
                      </list-item>
                      <list-item>
                        <p>“Why is that the answer?”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S2: student unpacks correct strategy</td>
                  <td>The student describes the appropriate method they used for the answer</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“I multiplied 5 times 4.”</p>
                      </list-item>
                      <list-item>
                        <p>“I took 5 and 4 and multiplied.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T3: praise</td>
                  <td>The teacher praises the student’s effort</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“Good job.”</p>
                      </list-item>
                      <list-item>
                        <p>“Nice job, buddy.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>Lesson 2: responding to an incorrect answer</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T1: read the problem</td>
                  <td>—<sup>d</sup></td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S1: brief student incorrect answer</td>
                  <td>The student provides an incorrect answer without additional detail</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“I don’t know. Nine fish?”</p>
                      </list-item>
                      <list-item>
                        <p>“It’s nine fish I think.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T2: unpack strategy request (incorrect)</td>
                  <td>After the student provides an incorrect answer, the teacher asks the student to explain</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S2: student unpacks incorrect strategy</td>
                  <td>The student describes the inappropriate method they used for the answer</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“I added 5 plus 4.”</p>
                      </list-item>
                      <list-item>
                        <p>“I used addition.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T3a: underscore task feature (strategy)</td>
                  <td>The teacher asks why the student used a specific incorrect strategy</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“What in the problem made you add?”</p>
                      </list-item>
                      <list-item>
                        <p>“Tell me why you used addition.”<sup>e</sup></p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S3: strategy explication</td>
                  <td>The student describes why they used an incorrect strategy</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“Well, you said there were 5 fishbowls and 4 fish.”</p>
                      </list-item>
                      <list-item>
                        <p>“I didn’t know what to do, so I added.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T3b: underscore task feature (problem)</td>
                  <td>The teacher prompts the student to re-examine the problem</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“What is the problem asking you to do?”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S4: feature identification</td>
                  <td>The student proposes a new approach based on the problem features</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“I see. I need to count the fish in all of the bowls.”</p>
                      </list-item>
                      <list-item>
                        <p>“I need to add five ‘4s’ together.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T4: teacher grouping request</td>
                  <td>The teacher asks the student to attempt the problem again</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“What would your answer be now?”</p>
                      </list-item>
                      <list-item>
                        <p>“Can you try solving again?”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S5: brief student correct answer</td>
                  <td>The student provides the correct answer without additional detail</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>“You would have 20 fish then.”</p>
                      </list-item>
                      <list-item>
                        <p>“The answer is 20.”</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T5: unpack strategy request (correct)</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>S6: student unpacks correct strategy</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>T6: praise</td>
                  <td>—</td>
                  <td>—</td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table2fn1">
                <p><sup>a</sup>T: teacher.</p>
              </fn>
              <fn id="table2fn2">
                <p><sup>b</sup>S: student.</p>
              </fn>
              <fn id="table2fn3">
                <p><sup>c</sup>To prevent rote responding, the students provided varied responses for each step. The examples shown are not exhaustive.</p>
              </fn>
              <fn id="table2fn4">
                <p><sup>d</sup>The content is identical to the previous version of the step.</p>
              </fn>
              <fn id="table2fn5">
                <p><sup>e</sup>Variations for teachers refer to potentially correct examples. Examples are not exhaustive.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
        </sec>
        <sec>
          <title>SKIL Survey</title>
          <p>We assessed the respondents’ stated understanding of questioning using an adapted version of the SKIL Survey [<xref ref-type="bibr" rid="ref41">41</xref>]. The survey consisted of concepts rated across three scales: (1) <italic>knowledge</italic> of the content, (2) <italic>confidence</italic> in the use of the techniques, and (3) perceived <italic>usefulness</italic>. The respondents rated the items using a 4-point Likert-type scale ranging from 0 (eg, <italic>no knowledge</italic>) to 3 (eg, <italic>substantial knowledge</italic>). We presented a small sample of eight assessment items because of the narrow focus of the training. Surveys featuring a reduced number of items obtained acceptable internal consistency in previous studies, with a Cronbach α for knowledge of .907, confidence of .882, and usefulness of .915 [<xref ref-type="bibr" rid="ref13">13</xref>]. We delivered instructions regarding the purpose of the assessment before each administration. The participants completed the SKIL Survey during the baseline and maintenance sessions.</p>
        </sec>
        <sec>
          <title>VMP Assessment</title>
          <p>The VMP and OMPs were administered concurrently to determine the correspondence between the simulation-administered assessments and direct observations conducted by a human. The VMP assessed the exact same steps in the procedure as the acquisition and generalization OMPs via the speech classifier embedded in the simulation, which (1) recorded textual output corresponding to a participant’s spoken response, (2) determined whether the text’s classification matched the classification of correct responses for each step, and (3) calculated the percentage of correct steps completed by the participant.</p>
        </sec>
      </sec>
      <sec>
        <title>Design</title>
        <p>We analyzed the effectiveness of the intervention using a single-blind, independent measures pretest-posttest design. The participants were placed in an intervention condition (ie, lecture, model, and VR practice) or a control condition (lecture and model only) using stratified random assignment [<xref ref-type="bibr" rid="ref40">40</xref>] based on baseline OMP scores. Randomization was achieved using Microsoft Excel. The identities of the participants were concealed from the researchers during the randomization process.</p>
      </sec>
      <sec>
        <title>Simulation</title>
        <p>The VR simulation featured in this study was developed over the course of 2 years by an interdisciplinary team consisting of faculty in behavior analysis, math education, and computer engineering. A task analysis [<xref ref-type="bibr" rid="ref39">39</xref>] of mathematical questioning was conducted to identify the teacher and student actions emitted during applications of mathematical questioning. In a departure from the typical task analysis procedure, we created different lessons based on likely student responses. The initial analysis included many possible variations accounting for student actions such as nonresponses. This became the basis for the skills evaluated in this study: (1) responding to a correct answer and (2) responding to an incorrect answer (ie, lessons 1 and 2). An example of the flowcharts resulting from this process that illustrate the possible sequences of events in a scenario, as well as sequences in lessons 1 and 2, are shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>. <xref ref-type="table" rid="table2">Table 2</xref> describes the specific steps in each lesson.</p>
        <p>The simulation corresponding to the mathematical questioning procedure consisted of multiple components. A custom React [<xref ref-type="bibr" rid="ref43">43</xref>] web application permitted the generation of simulation content (eg, steps in a procedure), which was stored in a database for retrieval by the simulation. <xref rid="figure2" ref-type="fig">Figure 2</xref> depicts the web application used to generate flowcharts, allowing for different lessons based on the anticipated student responses. The application further allowed for the generation of reports regarding the performance of the participants (<xref rid="figure3" ref-type="fig">Figure 3</xref>). The simulation, developed in Unity (Unity Technologies), allows trainees to interact with a virtual student in a simulated classroom environment. All VR assessments and instructional sessions across experimental conditions began with the participant verbally presenting the student avatar with a math problem involving multiplication before deviating into different pathways based on the initial student response. A depiction of the start of a typical simulation and user prompt is shown in <xref rid="figure4" ref-type="fig">Figure 4</xref>. We trained the speech classification AI to recognize the topographical variations of potential participant statements. The key technical aspects of this work include (1) the ability of the virtual student to speak to the participant, (2) the ability of the participant to vocally respond to the virtual student, and (3) the ability of the simulation to classify the participant’s responses as correct or incorrect.</p>
        <p>Speech from the student avatar was accomplished using IBM Watson’s [<xref ref-type="bibr" rid="ref44">44</xref>] Text-to-Speech, which converted text strings corresponding to predetermined student responses into audio data. To promote the extent to which trainees responded correctly to distinct student statements that should nonetheless evoke a similar step in the procedure (eg, incorrect response; nonresponse) [<xref ref-type="bibr" rid="ref45">45</xref>], student avatar responses at each step were drawn from functionally identical yet topographically dissimilar text strings. Examples of the student statements are listed in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <p>Assessment of the trainees’ responses was accomplished using IBM’s Speech-to-Text, which converted the trainees’ statements into a text string, and the Google Natural Language AI service [<xref ref-type="bibr" rid="ref46">46</xref>], which determined whether a trainee’s transcribed statement matched the targeted response for a specific step of the procedure. The text classifier was trained using phrases corresponding to each step of the simulation (<xref ref-type="table" rid="table2">Table 2</xref>). After training, the classifier could be used to identify novel text strings that did not perfectly match the training phrases. This allowed the simulation to accommodate variability in the trainees’ responses. The classifier would provide a confidence value between 0.00 and 1.00, specifying the degree to which the provided text corresponded to each step of the procedure. Higher values reflected a greater degree of confidence in a statement’s correspondence to the phrases included in the training. We established a classifier threshold (eg, 0.75) to determine how closely the participants’ responses needed to match the expected response at each step. If the classification confidence exceeded the threshold, the system identified the participants’ responses as correct.</p>
        <p>When combined with recorded lectures describing the rationale for a procedure and a model of the procedure’s delivery, the use of the VR simulation comprised a computer-mediated form of BST. Resources associated with the appropriate delivery of BST have often prevented its use in practice [<xref ref-type="bibr" rid="ref47">47</xref>]. Consequently, automating instructor-intensive portions of the practice may assist in disseminating effective training practices.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowcharts depicting an example of an appropriate sequence of events in a scenario (top), steps in lesson 1 (middle), and steps in lesson 2 (bottom).</p>
          </caption>
          <graphic xlink:href="games_v10i4e41097_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Web application page depicting tools used to design flowcharts and novel lessons. Lesson creation provides a drag and drop interface to allow the creation and connection of nodes for a flowchart. In addition, classifications can be assigned to each node. Once the flowchart is completed, the lesson creation page also allows the user to create individual lessons needed to run a simulation. VR: virtual reality.</p>
          </caption>
          <graphic xlink:href="games_v10i4e41097_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Reports page depicting simulation feedback. The report includes all the information recorded by the simulation feedback. Having reports accessible allows the instructors to create personalized analyses for each trainee and create a profile to determine how effectively the trainee understands the presented material.</p>
          </caption>
          <graphic xlink:href="games_v10i4e41097_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Depiction of basic virtual scenario and textual user prompt.</p>
          </caption>
          <graphic xlink:href="games_v10i4e41097_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Procedures</title>
        <sec>
          <title>Baseline</title>
          <p>During the baseline session, the participants completed a brief demographic probe and the SKIL Survey. To acclimate the participants to VR, the participants completed a brief custom tutorial introducing them to concepts such as the need to depress and hold the right trigger while speaking as well as the appearance of onscreen prompts. The participants then completed 2 OMPs related to lessons 1 (ie, student avatar responds correctly) and 2 (ie, student avatar responds incorrectly). For both lessons, the initial prompt presented on the Oculus display—a math problem based on content commonly featured in 3rd grade mathematics—was “You have 5 fish bowls. There are 4 fish in each bowl. How many fish do you have total?” Together, the 2 OMPs evaluated the participants’ ability to follow best practice over 10 teacher responses. The OMP for each lesson terminated immediately following an incorrect response. Although the system classified and scored each participant, the session administrator performed classifications manually to ensure an accurate assessment of the performance of the participants. Regardless of when the OMP was terminated, the simulation displayed “This concludes the session” at the conclusion of the probe. No further feedback was provided.</p>
        </sec>
        <sec>
          <title>Training and Posttest Session</title>
          <sec>
            <title>Overview</title>
            <p>After the completion of the baseline assessments, the participants were randomly assigned to the control and experimental groups. Before assignment, we divided the entire sample into groups based on baseline OMP scores; members of these groups were then randomly assigned to the treatment conditions to ensure roughly equivalent baseline OMP scores for the control (mean 22, SD 4.140) and treatment groups (mean 22.67, SD 4.577). Sessions were conducted 1 week following baseline.</p>
          </sec>
          <sec>
            <title>Control</title>
            <p>The participants in the control condition watched a video-recorded lecture concerning the rationale and steps of the procedures for lessons 1 and 2. The lectures also included video models displaying educators using the procedures in practice with elementary-aged students. The lecture concluded with a description of the problem used in the OMP (ie, “You have 5 fishbowls…”) and a description of how the procedures would be applied to this specific problem. The duration of the lecture was approximately 12 minutes. Following the lecture, the participants completed the same OMP used during the baseline sessions. In addition, the participants completed a generalization OMP featuring a novel problem: “There are 4 buckets. There are 3 apples in each bucket. How many apples are there total?” The student avatar’s responses were adjusted to accommodate the new prompt. The generalization OMP terminated following the first incorrect response.</p>
          </sec>
          <sec>
            <title>Intervention</title>
            <p>The participants in the intervention group observed the same recorded lecture provided in the control condition. Thereafter, the participants received a series of supplemental VR trainings. For each lesson, the participants received 2 simulations of error-free prompting (EFPT), followed by 2 sessions of delayed prompting (DPT). EFPT simulations followed the general format of typical OMP; however, written examples of correct responses appeared on the screen immediately after each statement made by the student avatar. For DPT, prompts appeared on the screen following an incorrect response or nonresponse (ie, no response within 4 seconds). Immediately following each DPT, the simulation displayed the percentage of steps completed correctly and a description of the steps of each procedure missed (ie, performance feedback [<xref ref-type="bibr" rid="ref48">48</xref>]). Classifications of participant performance, prompts, and feedback were all managed by the simulation without input from the session administrator. The combined duration of the supplemental VR trainings was approximately 10 minutes. The participants completed both the acquisition and generalization OMPs following training.</p>
          </sec>
        </sec>
        <sec>
          <title>Maintenance</title>
          <p>One week following the posttest sessions, the participants from both groups completed an additional acquisition OMP and generalization OMP in accordance with the procedures observed in the baseline and posttest sessions. The participants also completed an additional SKIL Survey as well as an assessment related to the acceptability of the training.</p>
        </sec>
      </sec>
      <sec>
        <title>Analysis</title>
        <p>For OMPs, a 2-way mixed-design ANOVA was used. The analysis evaluated differences using a between-participants factor of treatment (control or intervention) and a within-participant factor of time (baseline, posttest, and maintenance sessions). Partial eta squared, η<italic><sub>p</sub></italic><sup>2</sup>, was used to indicate the extent of group differences, with values of 0.02, 0.13, and 0.26 representing small, moderate, and large effects, respectively [<xref ref-type="bibr" rid="ref49">49</xref>]. Statistically significant main effects, if observed, were followed by an analysis of simple effects using within- and independent samples <italic>t</italic> tests (2-tailed). Effect sizes were determined using Cohen <italic>d</italic>, with values of 0.8, 0.5, and 0.2 for large, medium, and small effects, respectively [<xref ref-type="bibr" rid="ref50">50</xref>]. Sphericity, normality, and homogeneity were evaluated using Mauchly, Shapiro-Wilk, and Levene tests, respectively.</p>
        <p>The differences between the SKIL Survey responses in the baseline and maintenance sessions were analyzed using the Mann-Whitney <italic>U</italic> test, a nonparametric alternative for comparing group differences [<xref ref-type="bibr" rid="ref50">50</xref>]. Effect sizes were determined using Cohen <italic>r</italic>, with scores exceeding 0.5 representing a large effect, scores between 0.49 and 0.3 representing a moderate effect, and scores between 0.29 and 0.1 representing a small effect [<xref ref-type="bibr" rid="ref51">51</xref>]. We initially examined differences in confidence, given that knowledge and usefulness ratings were likely to stem from didactic instruction (ie, information received by the participants rather than opportunities for practice), which did not differ between the 2 groups. In addition, the results of our previous research suggested that these 2 dimensions are insensitive to VR training [<xref ref-type="bibr" rid="ref13">13</xref>]. However, we compared the findings across the knowledge and usefulness scales as an exploratory analysis.</p>
        <p>Correspondence, defined as OMPs and VMP recording the same value (eg, correct or incorrect) for a participant’s response, was collected for each acquisition assessment, generalization assessment, and the VR simulations comprising the supplemental instruction. The calculations involved dividing the number of correspondences by the total number of responses and multiplying by 100.</p>
        <p>Multiple comparison corrections were conducted for the 15 a priori statistical tests and 4 additional post hoc tests using the Benjamini-Hochberg procedure [<xref ref-type="bibr" rid="ref52">52</xref>] with a false-discovery rate of 10%. All raw <italic>P</italic> values, reported throughout, were significant following the Benjamini-Hochberg procedure unless indicated otherwise. All analyses were conducted using SPSS (IBM Corp).</p>
      </sec>
      <sec>
        <title>Interobserver Agreement</title>
        <p>Interobserver agreement (IOA) was collected across all phases of the project. Specifically, a doctoral-level faculty member (ie, the secondary observer) with experience observing the completion of the mathematical questioning procedure [<xref ref-type="bibr" rid="ref14">14</xref>] collected OMP data—including generalization probes—in 43% of the baseline sessions, 28% of the posttest sessions, and 20% of the maintenance sessions across treatment and control groups. The secondary observer’s results were compared with those of the session administrator. IOA was then calculated by dividing the number of agreements (ie, steps in the procedure in which observers recorded the same response) by the total number of steps in lessons 1 and 2 and multiplying the resultant number by 100%. The average IOA for the baseline and posttest sessions was 100% (SD 0%). The average IOA for the maintenance session was 100% for the experimental group and 93.33% (SD 9%; range 80%-100%) for the control group.</p>
      </sec>
      <sec>
        <title>Fidelity</title>
        <p>We assessed the experimental protocols across all conditions using the checklists featured in our previous work [<xref ref-type="bibr" rid="ref14">14</xref>]. The checklists indicated whether the session administrator delivered appropriate instructions, assessments, and simulation components. Fidelity was collected across numerous sessions in the baseline (43%), posttest (26%), and maintenance conditions (20%) and determined by calculating the percentage of steps for each session performed by the session administrator. The average baseline fidelity was 98.07% (SD 4.69%; range 87.50%-100%). In the posttest sessions, fidelity for the control and experimental groups was 100% and 95% (SD 5.77%; range 90%-100%), respectively. Fidelity across maintenance sessions was 100%.</p>
      </sec>
      <sec>
        <title>Acceptability</title>
        <p>During the maintenance session, we used a consumer satisfaction survey featured in previous studies [<xref ref-type="bibr" rid="ref13">13</xref>] to assess the acceptability of the simulation. The participants responded to statements concerning the project (ie, <italic>The use of VR was acceptable to me; I had no difficulty using VR</italic>) using a 6-point scale (1=<italic>strongly disagree</italic>; 6=<italic>strongly agree</italic>). The participants also answered a series of questions related to their experiences in the simulation.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>Descriptive statistics for baseline, posttest, and maintenance variables are listed in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Descriptive statistics for baseline, posttest, and maintenance variables across groups.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="440"/>
            <col width="170"/>
            <col width="170"/>
            <col width="160"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Variable</td>
                <td>Total</td>
                <td>Control</td>
                <td>Intervention</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="6">
                  <bold>Pretest session</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">OMP<sup>a</sup> (percentage of correct responses), mean (SD); range</td>
                <td>22.33 (4.30); 20-30</td>
                <td>22 (4.14); 20-30</td>
                <td>22.67 (4.58); 20-30</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>SKIL variables</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Knowledge, mean (SD); range</td>
                <td>1.28 (0.47); 0.50-2.25</td>
                <td>1.48 (0.49); 0.63-2.25</td>
                <td>1.08 (0.37); 0.38-1.63</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Confidence, mean (SD); range</td>
                <td>1.19 (0.61); 0-2.13</td>
                <td>1.42 (0.60); 0.13-2.25</td>
                <td>0.97 (0.54); 0-1.63</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Usefulness, mean (SD); range</td>
                <td>1.73 (0.60); 0.38-2.75</td>
                <td>1.83 (0.60); 0.38-2.5</td>
                <td>1.63 (0.61); 0.5-2.75</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Posttest session</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>OMP</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Percentage of correct responses, mean (SD); range</td>
                <td>75.67 (22.08); 40-100</td>
                <td>63.33 (22.64); 50-100</td>
                <td>88.00 (22.62); 40-100</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Generalization, percentage of correct responses, mean (SD); range</td>
                <td>76.33 (24.70); 30-100</td>
                <td>66.00 (22.62); 30-100</td>
                <td>86.67 (22.89); 50-100</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>SKIL variables<sup>b</sup></bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Knowledge, mean (SD); range</td>
                <td>2.36 (0.52); 1.25-3</td>
                <td>2.27 (0.53); 1.25-2.88</td>
                <td>2.45 (0.51); 1.5-3</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Confidence, mean (SD); range</td>
                <td>2.23 (0.51); 1.38-2.88</td>
                <td>2.04 (0.52); 1.25-2.75</td>
                <td>2.41 (0.45); 1.5-2.88</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Usefulness, mean (SD); range</td>
                <td>2.70 (0.32); 1.88-3</td>
                <td>2.68 (0.35); 1.88-3</td>
                <td>2.72 (0.30); 2-3</td>
              </tr>
              <tr valign="top">
                <td colspan="6">
                  <bold>Maintenance session</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="5">
                  <bold>OMP</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Percentage of correct responses, mean (SD); range</td>
                <td>69 (24.96); 30-100</td>
                <td>54.67 (15.98); 30-100</td>
                <td>83.33 (24.40); 50-100</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Generalization, percentage of correct responses, mean (SD); range</td>
                <td>72.33 (25.69); 30-100</td>
                <td>58 (20.07); 30-100</td>
                <td>86.67 (22.89); 50-100</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>OMP: observed mastery probe.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Knowledge, confidence, and usefulness were determined using 4-point scales from the SKIL Survey [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>OMP Assessment</title>
        <sec>
          <title>Acquisition</title>
          <p>The Mauchly test indicated that the assumption of sphericity (ie, the equality of variance among difference scores among all testing variables) was not violated (<italic>χ</italic><sup>2</sup><sub>2</sub>=0.6; <italic>P</italic>=.74). A Shapiro-Wilk test indicated that the distribution of assessment scores for both groups across the baseline, posttest, and maintenance OMP assessments violated the assumption of normality (<italic>P</italic>≤.02). Nonetheless, we performed a mixed-design ANOVA, given that previous data simulations [<xref ref-type="bibr" rid="ref53">53</xref>] suggested that ANOVA remains robust when data are not normally distributed. For the baseline and postintervention outcomes for the OMPs, a Levene test indicated that all the measures met the assumption of homogeneity. However, the results of the Levene test suggested that the maintenance scores violated the assumption of homogeneity (<italic>P</italic>=.04). Nonetheless, an ANOVA was performed, given that it is generally robust against violations of homogeneity when sample sizes are equal [<xref ref-type="bibr" rid="ref54">54</xref>].</p>
          <p>We analyzed the data using a mixed-design ANOVA with a between-participants factor of treatment (control and intervention) and within-participants factor of time (baseline, posttest, and maintenance sessions). Large main effects of time (<italic>F</italic><sub>2,27</sub>=124.154; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.816) and treatment (<italic>F</italic><sub>1,28</sub>=19.281; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.408), as well as the interaction effect (<italic>F</italic><sub>2,28</sub>=8.429; <italic>P</italic>&#60;.001; η<italic><sub>p</sub></italic><sup>2</sup>=0.231) for the OMPs were significant, suggesting a difference in performance between the 2 groups at each time point. Subsequent simple effects tests of within- and between-subjects scores were performed to determine whether the 2 randomly equivalent groups differed.</p>
          <p>Within-samples <italic>t</italic> tests revealed a large, significant improvement for the control group between the baseline and posttest sessions (<italic>t</italic><sub>14</sub>=−10.313; <italic>P</italic>&#60;.001; Cohen <italic>d</italic>=2.66) and a significant decrease in performance between the posttest and maintenance sessions (<italic>t</italic><sub>14</sub>=2.303; <italic>P</italic>=.02; Cohen <italic>d</italic>=−0.595). Similarly, the intervention group exhibited a large, significant improvement in performance between the baseline and posttest sessions (<italic>t</italic><sub>14</sub>=−11.859; <italic>P</italic>&#60;.001; Cohen <italic>d</italic>=3.062); however, differences between the posttest and maintenance sessions were not significant (<italic>t</italic><sub>14</sub>=0.699; <italic>P</italic>=.20), reflecting more stable performance across the 2 probes.</p>
          <p>We also performed independent samples <italic>t</italic> tests comparing the performance of the control and intervention groups at each time point. Differences in baseline acquisition OMP were not significant (<italic>t</italic><sub>28</sub>=0.418; <italic>P</italic>=.40). However, differences between the intervention and control groups were both large and significant at the posttest (<italic>t</italic><sub>28</sub>=3.653; <italic>P</italic>&#60;.001; Cohen <italic>d</italic>=1.334) and maintenance sessions (<italic>t</italic><sub>28</sub>=3.807; <italic>P</italic>&#60;.001; Cohen <italic>d</italic>=1.39), suggesting that the VR simulation increased scores relative to those of the participants who exclusively received the lecture.</p>
        </sec>
        <sec>
          <title>Generalization</title>
          <p>Within-samples <italic>t</italic> tests on the generalization OMP revealed a moderate, significant decrease between the posttest and maintenance probes for the control group (<italic>t</italic><sub>14</sub>=1.824; <italic>P</italic>=.045; Cohen <italic>d</italic>=−0.471). Changes between the posttest and maintenance sessions for the intervention group were not significant (<italic>t</italic><sub>14</sub>=0; <italic>P</italic>=.50). Independent samples <italic>t</italic> tests revealed robust, significantly higher scores for the intervention group at both the posttest (<italic>t</italic><sub>28</sub>=2.488; <italic>P</italic>=.01; Cohen <italic>d</italic>=0.908) and maintenance sessions (<italic>t</italic><sub>28</sub>=3.647; <italic>P</italic>&#60;.001; Cohen <italic>d</italic>=1.332).</p>
        </sec>
      </sec>
      <sec>
        <title>SKIL Survey</title>
        <p>The participants rated their knowledge, confidence, and understanding of 8 criteria pertaining to the questioning procedure during the baseline and maintenance sessions using the SKIL Survey. We averaged the 8 dimensions of each value across each domain (<xref ref-type="table" rid="table3">Table 3</xref>). The treatment group reported lower ratings across all scales, relative to the control group, before the intervention. Following the intervention, the ratings across all scales were higher for the treatment group. Statistical comparisons of ratings at baseline and maintenance, performed using the Mann-Whitney <italic>U</italic> test, were initially limited to the confidence domain. The control group exhibited small, significantly higher confidence ratings than the intervention group at baseline, with <italic>U</italic>=64, <italic>P</italic>=.04, and Cohen <italic>r</italic>=0.142. At maintenance, the intervention group exhibited small, significantly higher scores than the control group, <italic>U</italic>=64, <italic>P</italic>=.04, Cohen <italic>r</italic>=0.137. However, inclusion of the knowledge and usefulness scales in the statistical analyses resulted in nonsignificant adjusted <italic>P</italic> values across all scales, including confidence. Following the Benjamini-Hochberg procedure, we observed no significant between-group differences in knowledge or usefulness either before (<italic>U</italic>=57, <italic>P</italic>=.02 and <italic>U</italic>=83, <italic>P</italic>=.22) or after the intervention (<italic>U</italic>=85, <italic>P</italic>=.25 and <italic>U</italic>=107, <italic>P</italic>=.82).</p>
      </sec>
      <sec>
        <title>Correspondence</title>
        <p>Across all conditions and groups, the average correspondence between the acquisition OMP and VMP was 95.98% (SD 7.44%; range 71.43%-100%). The correspondence between generalization OMP and VMP was slightly lower (mean 92.44%, SD 10.30%; range 66.67%-100%). Although not included as measures of performance, we also collected observation data during the probes conducted as part of the intervention (ie, EFPT and DPT). The correspondence between the observed and automated measures during the intervention was high (mean 98.03%, SD 2.96%; range 90.48%-100%).</p>
      </sec>
      <sec>
        <title>Acceptability</title>
        <p>Both the treatment (mean 5.73, SD 0.59; range 4-6) and control (mean 5.65, SD 0.82; range 4-6) groups provided high acceptability ratings for the VR portions of their conditions. The treatment (mean 6) and control (mean 5.87, SD 0.35; range 5-6) groups likewise agreed that they had no difficulty using VR.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study compared the effectiveness of a training package featuring VR with didactic instruction as a means of teaching steps in a mathematical questioning strategy. Although participant performance improved following both forms of instruction, the results suggest that gains of the control group deteriorated during maintenance. Differences in performance between the posttest and maintenance sessions favored the VR group, whose scores were significantly higher than those of the participants who received didactic instruction exclusively. A similar pattern of performance was observed for untaught generalization measures. Notwithstanding the results of exploratory analyses featuring all the SKIL Survey scales, the results further suggest that VR contributed to higher confidence in the performance of the procedure. The correspondence between the measures of performance administered by human observers and those administered by AI was generally high. These positive findings, combined with favorable acceptability ratings, support broader applications of VR in education and provide avenues for future inquiry.</p>
        <p>Differences observed between the treatment and control groups, although consistent with the positive effects observed in recent literature involving education and VR, were more pronounced in this study than in many previous studies [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]. This is likely because of the relatively low responses of participants in the baseline OMP, which mitigated the ceiling effects imposed by the primary measure. In addition, our VR training adapted an evidence-based approach to personnel preparation [<xref ref-type="bibr" rid="ref29">29</xref>]. Although many simulations are premised on the belief that engagement in a simulated activity with little immediate guidance is beneficial to the learner [<xref ref-type="bibr" rid="ref56">56</xref>], the findings from this study provide further support for immediate feedback associated with behavioral teaching methods and facilitated through automation [<xref ref-type="bibr" rid="ref57">57</xref>]. Likewise, the high acceptability of VR across groups corresponds with the growing body of research [<xref ref-type="bibr" rid="ref50">50</xref>] suggesting that modern VR hardware and approaches to simulation have alleviated motion sickness and other issues associated with earlier VR applications in education [<xref ref-type="bibr" rid="ref15">15</xref>].</p>
        <p>Given that the participants in previous studies required days of exposure to the simulation before mastering the procedure [<xref ref-type="bibr" rid="ref14">14</xref>], the extent to which the treatment group participants acquired the procedure following a single session was surprising. The findings further suggest that the participants in the control group scored significantly lower on maintenance assessments, whereas scores in the intervention group did not significantly deteriorate. These results must be placed in the context of the limited number of items included in this experiment; nonetheless, the finding that simulation facilitated individualized skill rehearsal—often difficult to arrange in instructor-administered professional development and teacher education programs—provides substantial support for the use of automated opportunities for rehearsal as a supplement to typical instruction. Similar results in the generalization OMP likewise provide qualified support for the VR condition and support the contention that the participants were not merely memorizing appropriate responses based on the original problem. Nonetheless, future work will need to demonstrate the effect of the intervention on a wider range of problems and in practice.</p>
        <p>Comparisons between OMPs and VMP revealed acceptable levels of agreement across the conditions. However, the disparities across conditions (ie, higher correspondence in prompting conditions relative to assessments) suggest that the feasibility of AI assessment in professional development, in the absence of extensive classification training, should vary based on the objectives of instruction. That is, the classifier used in this study appears to be suitable for procedures that require minimal deviation from a structured protocol or for determining the extent to which trainees exhibit statements closely aligned with training. As most trainings typically do not extensively assess individuals before instruction (ie, during baseline) and are designed to encourage the exhibition of targeted skills, the capabilities of the current automated system may be appropriate for the typical training context.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several notable limitations. The small convenience sample comprised students from a number of backgrounds that differed considerably from many professionals in education. Therefore, the results may not resemble those likely to be achieved among the targeted population. Given our research questions and the early stage of this scholarship, our emphasis on functionality, rather than external validity, is nonetheless appropriate. In addition, the VR group received more exposure to the procedure than the control group, whose participants did not receive a conventional alternative to the rehearsal provided in VR. However, the more passive training provided to the control group is representative of the instruction that appears in many preservice programs [<xref ref-type="bibr" rid="ref1">1</xref>] and in-service professional development trainings [<xref ref-type="bibr" rid="ref2">2</xref>]. The comparison in this study is appropriate because the primary purpose of AI-enhanced VR is to provide opportunities for rehearsal in instructional situations where individualized role-play is not possible. Given the emphasis on speech, we could have implemented the active components of the training using a less immersive platform (eg, a desktop computer). Nonetheless, the current integration of VR and AI contributes to the literature, given (1) the common view that immersion alone provides a benefit to the learner [<xref ref-type="bibr" rid="ref38">38</xref>] and (2) the limited work regarding the use of AI and VR in teacher training [<xref ref-type="bibr" rid="ref22">22</xref>]. Additional research is needed to compare immersive simulations with more conventional training approaches and explore the impact of emerging technologies on teacher education and professional development.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>The current VR simulation demonstrates the feasibility of providing instruction in teaching methods using an automated version of an evidence-based training method (ie, BST). Additional work is needed to demonstrate positive effects across a broader range of procedures and settings. The current system analyzes the user based on speech input, which is valuable given the heavy emphasis placed on verbal communication in education. However, the opportunities VR provides to analyze head movement, controller positions, and gaze are what separate the technology from more common platforms. VR training provides opportunities to rehearse behaviors used in practice [<xref ref-type="bibr" rid="ref58">58</xref>,<xref ref-type="bibr" rid="ref59">59</xref>] rather than button pressing or other distal representations of authentic performance [<xref ref-type="bibr" rid="ref13">13</xref>]. Incorporating motion sensing and speech recognition into future work can provide opportunities to train a wide range of complex skills.</p>
        <p>Demonstrating the ability of VR-based instruction to promote generalization beyond simulated environments to authentic settings remains a fundamental challenge for the medium [<xref ref-type="bibr" rid="ref58">58</xref>]. Behavioral theories of learning suggest that prompts and reinforcers can be paired with a variety of antecedents (ie, multiple exemplars) to create antecedent stimulus classes that should nonetheless produce the same response from the learner [<xref ref-type="bibr" rid="ref39">39</xref>]. This has implications for VR instruction, as learners must (1) be capable of generalizing skills learned in simulations to the actual performance context and (2) apply targeted skills when confronted with situations that do not precisely resemble the situations addressed in training. The ability of VR to alter aspects of a learning simulation across repeated uses (eg, avatar behavior and appearance) has the potential to assist practitioners in generalizing their skills [<xref ref-type="bibr" rid="ref7">7</xref>]. Randomizing student avatar characteristics (eg, gender and race) may also prevent the bias associated with repeatedly pairing specific types of student behavior with a specific student profile [<xref ref-type="bibr" rid="ref59">59</xref>]. Addressing such issues will require research that stretches beyond the skills and application contexts featured in this study.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>The findings of this study suggest that an automated, structured approach to VR can improve the acquisition of an educational procedure and participant confidence relative to more conventional, didactic methods. The participants further reported that VR was acceptable and easy to use. Automated assessments of performance generally corresponded to observations conducted by researchers, particularly in conditions where the probes were preceded by guidance regarding appropriate responses. Although promising, additional work is required to explore the effects of AI-enhanced VR on more complex procedures and the cascading effect of such training on practitioners in the field.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BST</term>
          <def>
            <p>behavioral skills training</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DPT</term>
          <def>
            <p>delayed prompting</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">EFPT</term>
          <def>
            <p>error-free prompting</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">IOA</term>
          <def>
            <p>interobserver agreement</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">OMP</term>
          <def>
            <p>observed mastery probe</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">VMP</term>
          <def>
            <p>virtual mastery probe</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">VR</term>
          <def>
            <p>virtual reality</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors wish to thank Drs Guadalupe Canahuate and Anton Kruger of the University of Iowa for their feedback and guidance. This study was supported by research grants from the Iowa Initiative for Artificial Intelligence and the Obermann Center for Advanced Studies.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Stillman</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Student teaching’s contribution to preservice teacher development: a review of research focused on the preparation of teachers for urban and high-needs contexts</article-title>
          <source>Rev Educ Res</source>
          <year>2013</year>
          <month>03</month>
          <day>01</day>
          <volume>83</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>69</lpage>
          <pub-id pub-id-type="doi">10.3102/0034654312468619</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yoon</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Duncan</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wen-Yu Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Scarloss</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Shapley</surname>
              <given-names>KL</given-names>
            </name>
          </person-group>
          <article-title>Reviewing the Evidence On How Teacher Professional Development Affects Student Achievement</article-title>
          <source>U.S. Department of Education, Institute of Education Sciences, National Center for Education Evaluation and Regional Assistance, Regional Educational Laboratory Southwest</source>
          <year>2007</year>
          <month>10</month>
          <access-date>2022-09-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ies.ed.gov/ncee/edlabs/regions/southwest/pdf/REL_2007033.pdf">https://ies.ed.gov/ncee/edlabs/regions/southwest/pdf/REL_2007033.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reid</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>O'Kane</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Macurik</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>WW</given-names>
            </name>
            <name name-style="western">
              <surname>Piazza</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Roane</surname>
              <given-names>HS</given-names>
            </name>
          </person-group>
          <article-title>Staff training and management</article-title>
          <source>Handbook of Applied Behavior Analysis</source>
          <year>2011</year>
          <publisher-loc>New York, NY, USA</publisher-loc>
          <publisher-name>The Guilford Press</publisher-name>
          <fpage>281</fpage>
          <lpage>94</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sawyer</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Andzik</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Kranak</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Willke</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Curiel</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Hensley</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Neef</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Improving pre-service teachers' performance skills through behavioral skills training</article-title>
          <source>Behav Anal Pract</source>
          <year>2017</year>
          <month>09</month>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>296</fpage>
          <lpage>300</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29021942"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40617-017-0198-4</pub-id>
          <pub-id pub-id-type="medline">29021942</pub-id>
          <pub-id pub-id-type="pii">198</pub-id>
          <pub-id pub-id-type="pmcid">PMC5622009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Knight</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Nieuwerburgh</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Instructional coaching: a focus on practice</article-title>
          <source>Coaching</source>
          <year>2012</year>
          <month>09</month>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>100</fpage>
          <lpage>12</lpage>
          <pub-id pub-id-type="doi">10.1080/17521882.2012.707668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Severtson</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Carr</surname>
              <given-names>JE</given-names>
            </name>
          </person-group>
          <article-title>Training novice instructors to implement errorless discrete-trial teaching: a sequential analysis</article-title>
          <source>Behav Anal Pract</source>
          <year>2012</year>
          <volume>5</volume>
          <issue>2</issue>
          <fpage>13</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23730463"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/BF03391820</pub-id>
          <pub-id pub-id-type="medline">23730463</pub-id>
          <pub-id pub-id-type="pmcid">PMC3592485</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dempsey</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Iwata</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>JN</given-names>
            </name>
            <name name-style="western">
              <surname>Rolider</surname>
              <given-names>NU</given-names>
            </name>
          </person-group>
          <article-title>Observer training revisited: a comparison of in vivo and video instruction</article-title>
          <source>J Appl Behav Anal</source>
          <year>2012</year>
          <volume>45</volume>
          <issue>4</issue>
          <fpage>827</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/23322937"/>
          </comment>
          <pub-id pub-id-type="doi">10.1901/jaba.2012.45-827</pub-id>
          <pub-id pub-id-type="medline">23322937</pub-id>
          <pub-id pub-id-type="pii">188-12</pub-id>
          <pub-id pub-id-type="pmcid">PMC3545506</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bastian</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Carpenter</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Placed for success: which teachers benefit from high-quality student teaching placements?</article-title>
          <source>Educ Policy</source>
          <year>2020</year>
          <month>08</month>
          <day>18</day>
          <volume>36</volume>
          <issue>7</issue>
          <fpage>1583</fpage>
          <lpage>611</lpage>
          <pub-id pub-id-type="doi">10.1177/0895904820951126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Cook</surname>
              <given-names>SC</given-names>
            </name>
          </person-group>
          <article-title>Unraveling evidence-based practices in special education</article-title>
          <source>J Spec Educ</source>
          <year>2011</year>
          <month>09</month>
          <day>08</day>
          <volume>47</volume>
          <issue>2</issue>
          <fpage>71</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1177/0022466911420877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Prophet</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The state of immersive technology research: a literature analysis</article-title>
          <source>Comput Human Behav</source>
          <year>2018</year>
          <month>09</month>
          <volume>86</volume>
          <fpage>77</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2018.04.019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Kapila</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Mixed-reality learning environments: integrating mobile interfaces with laboratory test-beds</article-title>
          <source>Comput Educ</source>
          <year>2017</year>
          <month>07</month>
          <volume>110</volume>
          <fpage>88</fpage>
          <lpage>104</lpage>
          <pub-id pub-id-type="doi">10.1016/j.compedu.2017.02.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Teaching training in a mixed-reality integrated learning environment</article-title>
          <source>Comput Human Behav</source>
          <year>2016</year>
          <month>09</month>
          <volume>62</volume>
          <fpage>212</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1016/j.chb.2016.03.094</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>King</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Dzenga</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Burch</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kennedy</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Teaching partial-interval recording of problem behavior with virtual reality</article-title>
          <source>J Behav Educ</source>
          <year>2020</year>
          <month>01</month>
          <day>04</day>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>202</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1007/s10864-019-09363-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>King</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Estapa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Boyer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Behavioral skills training through smart virtual reality: demonstration of feasibility for a verbal mathematical questioning strategy</article-title>
          <source>J Behav Educ (forthcoming)</source>
          <year>2022</year>
          <month>09</month>
          <day>16</day>
          <pub-id pub-id-type="doi">10.1007/s10864-022-09492-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Konradsen</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>A review of the use of virtual reality head-mounted displays in education and training</article-title>
          <source>Educ Inf Technol</source>
          <year>2017</year>
          <month>11</month>
          <day>25</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>1515</fpage>
          <lpage>29</lpage>
          <pub-id pub-id-type="doi">10.1007/s10639-017-9676-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Butt</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Kardong-Edgren</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ellertson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Using game-based virtual reality with haptics for skill acquisition</article-title>
          <source>Clin Simul Nurs</source>
          <year>2018</year>
          <month>03</month>
          <volume>16</volume>
          <fpage>25</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ecns.2017.09.010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A meta-analysis and systematic review of the effect of virtual reality technology on users' learning outcomes</article-title>
          <source>Comput Appl Eng Educ</source>
          <year>2022</year>
          <month>05</month>
          <day>19</day>
          <volume>30</volume>
          <issue>5</issue>
          <fpage>1470</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1002/cae.22532</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stavroulia</surname>
              <given-names>KE</given-names>
            </name>
            <name name-style="western">
              <surname>Makri-Botsari</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Psycharis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kekkeris</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Emotional experiences in simulated classroom training environments</article-title>
          <source>Int J Inf Learn Technol</source>
          <year>2016</year>
          <volume>33</volume>
          <issue>3</issue>
          <fpage>172</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1108/ijilt-10-2015-0030</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Clay</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schmitz</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Balakrishnan</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hopfenblatt</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kahng</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Feasibility of virtual reality behavior skills training for preservice clinicians</article-title>
          <source>J Appl Behav Anal</source>
          <year>2021</year>
          <month>04</month>
          <volume>54</volume>
          <issue>2</issue>
          <fpage>547</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1002/jaba.809</pub-id>
          <pub-id pub-id-type="medline">33482023</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>González-Calatayud</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Prendes-Espinosa</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Roig-Vila</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence for student assessment: a systematic review</article-title>
          <source>Appl Sci</source>
          <year>2021</year>
          <month>06</month>
          <day>12</day>
          <volume>11</volume>
          <issue>12</issue>
          <fpage>5467</fpage>
          <pub-id pub-id-type="doi">10.3390/app11125467</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akgun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Greenhow</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in education: addressing ethical challenges in K-12 settings</article-title>
          <source>AI Ethics</source>
          <year>2022</year>
          <month>06</month>
          <day>12</day>
          <volume>2</volume>
          <issue>3</issue>
          <fpage>431</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34790956"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s43681-021-00096-7</pub-id>
          <pub-id pub-id-type="medline">34790956</pub-id>
          <pub-id pub-id-type="pii">96</pub-id>
          <pub-id pub-id-type="pmcid">PMC8455229</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Tatnall</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence in education</article-title>
          <source>Encyclopedia of Education and Information Technologies</source>
          <year>2020</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>88</fpage>
          <lpage>103</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mousavinasab</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Zarifsanaiey</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Niakan Kalhori</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Rakhshan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Keikha</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ghazi Saeedi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Intelligent tutoring systems: a systematic review of characteristics, applications, and evaluation methods</article-title>
          <source>Interact Learn Environ</source>
          <year>2021</year>
          <volume>29</volume>
          <issue>1</issue>
          <fpage>142</fpage>
          <lpage>63</lpage>
          <pub-id pub-id-type="doi">10.1080/10494820.2018.1558257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Afzal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dempsey</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>D'Helon</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mukhi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pribic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sickler</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Strong</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vanchiswar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wilde</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>The personality of AI systems in education: experiences with the Watson tutor, a one-on-one virtual tutoring system</article-title>
          <source>Child Educ</source>
          <year>2019</year>
          <month>01</month>
          <day>16</day>
          <volume>95</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1080/00094056.2019.1565809</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lamb</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Etopio</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Bradley</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Virtual reality to train preservice teachers</article-title>
          <source>Games and Simulations in Teacher Education</source>
          <year>2020</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>141</fpage>
          <lpage>54</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rittle-Johnson</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Loehr</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Durkin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Promoting self-explanation to improve mathematics learning: a meta-analysis and instructional design principles</article-title>
          <source>ZDM</source>
          <year>2017</year>
          <month>01</month>
          <day>19</day>
          <volume>49</volume>
          <issue>4</issue>
          <fpage>599</fpage>
          <lpage>611</lpage>
          <pub-id pub-id-type="doi">10.1007/s11858-017-0834-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martino</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Maher</surname>
              <given-names>CA</given-names>
            </name>
          </person-group>
          <article-title>Teacher questioning to promote justification and generalization in mathematics: what research practice has taught us</article-title>
          <source>J Math Behav</source>
          <year>1999</year>
          <month>03</month>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>53</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1016/s0732-3123(99)00017-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Garderen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Scheuermann</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jackson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hampton</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Supporting the collaboration of special educators and general educators to teach students who struggle with mathematics: an overview of the research</article-title>
          <source>Psychol Schs</source>
          <year>2009</year>
          <month>01</month>
          <volume>46</volume>
          <issue>1</issue>
          <fpage>56</fpage>
          <lpage>78</lpage>
          <pub-id pub-id-type="doi">10.1002/pits.20354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kirkpatrick</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Akers</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Rivera</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Use of behavioral skills training with teachers: a systematic review</article-title>
          <source>J Behav Educ</source>
          <year>2019</year>
          <month>03</month>
          <day>28</day>
          <volume>28</volume>
          <issue>3</issue>
          <fpage>344</fpage>
          <lpage>61</lpage>
          <pub-id pub-id-type="doi">10.1007/s10864-019-09322-z</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Knez</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kahng</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the use of behavioral skills training to improve school staffs' implementation of behavior intervention plans</article-title>
          <source>J Behav Educ</source>
          <year>2014</year>
          <month>10</month>
          <day>07</day>
          <volume>24</volume>
          <issue>2</issue>
          <fpage>242</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1007/s10864-014-9213-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akers</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Pyle</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Higbee</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Pyle</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gerencser</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>A synthesis of script fading effects with individuals with autism spectrum disorder: a 20-year review</article-title>
          <source>Rev J Autism Dev Disord</source>
          <year>2015</year>
          <month>10</month>
          <day>30</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1007/s40489-015-0062-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cengher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Budd</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Farrell</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fienup</surname>
              <given-names>DM</given-names>
            </name>
          </person-group>
          <article-title>A review of prompt-fading procedures: implications for effective and efficient skill acquisition</article-title>
          <source>J Dev Phys Disabil</source>
          <year>2018</year>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>155</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1007/s10882-017-9575-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reed</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Erath</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Brand</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Novak</surname>
              <given-names>MD</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Dart</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Radley</surname>
              <given-names>KC</given-names>
            </name>
          </person-group>
          <article-title>Video modeling during coaching and performance feedback</article-title>
          <source>Technology Applications in School Psychology Consultation, Supervision, and Training</source>
          <year>2018</year>
          <publisher-loc>New York, NY, USA</publisher-loc>
          <publisher-name>Routledge</publisher-name>
          <fpage>46</fpage>
          <lpage>61</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Horner</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Carr</surname>
              <given-names>EG</given-names>
            </name>
            <name name-style="western">
              <surname>Halle</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>McGee</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Odom</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wolery</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The use of single-subject research to identify evidence-based practice in special education</article-title>
          <source>Except Child</source>
          <year>2005</year>
          <month>1</month>
          <volume>71</volume>
          <issue>2</issue>
          <fpage>165</fpage>
          <lpage>79</lpage>
          <pub-id pub-id-type="doi">10.1177/001440290507100203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Appelbaum</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kline</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Mayo-Wilson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nezu</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>SM</given-names>
            </name>
          </person-group>
          <article-title>Journal article reporting standards for quantitative research in psychology: the APA Publications and Communications Board task force report</article-title>
          <source>Am Psychol</source>
          <year>2018</year>
          <month>01</month>
          <volume>73</volume>
          <issue>1</issue>
          <fpage>3</fpage>
          <lpage>25</lpage>
          <pub-id pub-id-type="doi">10.1037/amp0000191</pub-id>
          <pub-id pub-id-type="medline">29345484</pub-id>
          <pub-id pub-id-type="pii">2018-00750-002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radley</surname>
              <given-names>KC</given-names>
            </name>
            <name name-style="western">
              <surname>Dart</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>TA</given-names>
            </name>
          </person-group>
          <article-title>Publication trends for single-case methodology in school psychology: a systematic review</article-title>
          <source>Psychol Sch</source>
          <year>2020</year>
          <month>05</month>
          <volume>57</volume>
          <issue>5</issue>
          <fpage>683</fpage>
          <lpage>98</lpage>
          <pub-id pub-id-type="doi">10.1002/pits.22359</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tarlow</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>An improved rank correlation effect size statistic for single-case designs: baseline corrected Tau</article-title>
          <source>Behav Modif</source>
          <year>2017</year>
          <month>07</month>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>427</fpage>
          <lpage>67</lpage>
          <pub-id pub-id-type="doi">10.1177/0145445516676750</pub-id>
          <pub-id pub-id-type="medline">27831527</pub-id>
          <pub-id pub-id-type="pii">0145445516676750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Radianti</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Majchrzak</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Fromm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wohlgenannt</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>A systematic review of immersive virtual reality applications for higher education: design elements, lessons learned, and research agenda</article-title>
          <source>Comput Educ</source>
          <year>2020</year>
          <month>04</month>
          <volume>147</volume>
          <fpage>103778</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compedu.2019.103778</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>JO</given-names>
            </name>
            <name name-style="western">
              <surname>Heron</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Heward</surname>
              <given-names>WL</given-names>
            </name>
          </person-group>
          <source>Applied Behavior Analysis. 3rd edition</source>
          <year>2019</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Pearson</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suresh</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>An overview of randomization techniques: an unbiased assessment of outcome in clinical research</article-title>
          <source>J Hum Reprod Sci</source>
          <year>2011</year>
          <month>01</month>
          <volume>4</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <lpage>11</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jhrsonline.org/article.asp?issn=0974-1208;year=2011;volume=4;issue=1;spage=8;epage=11;aulast=Suresh"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/0974-1208.82352</pub-id>
          <pub-id pub-id-type="medline">21772732</pub-id>
          <pub-id pub-id-type="pii">JHRS-4-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC3136079</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lane</surname>
              <given-names>KL</given-names>
            </name>
            <name name-style="western">
              <surname>Oakes</surname>
              <given-names>WP</given-names>
            </name>
            <name name-style="western">
              <surname>Powers</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Diebold</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Germer</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Common</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Brunsting</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Improving teachers’ knowledge of functional assessment-based interventions: outcomes of a professional development series</article-title>
          <source>Educ Treat Child</source>
          <year>2015</year>
          <month>2</month>
          <volume>38</volume>
          <issue>1</issue>
          <fpage>93</fpage>
          <lpage>120</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jstor.org/stable/44683853"/>
          </comment>
          <pub-id pub-id-type="doi">10.1353/etc.2015.0001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Mataras</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shepley</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Ayres</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>A meta-analysis and systematic review of the literature to evaluate potential threats to internal validity in probe procedures for chained tasks</article-title>
          <source>J Spec Educ</source>
          <year>2014</year>
          <month>09</month>
          <day>19</day>
          <volume>49</volume>
          <issue>3</issue>
          <fpage>135</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="doi">10.1177/0022466914550096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <article-title>React</article-title>
          <source>Meta Platforms</source>
          <year>2022</year>
          <access-date>2022-09-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://reactjs.org/">https://reactjs.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <article-title>IBM Watson products</article-title>
          <source>IBM</source>
          <access-date>2022-09-10</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ibm.com/watson/products-services">https://www.ibm.com/watson/products-services</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Joachim</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>St Peter</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A comparison of error-correction procedures on skill acquisition during discrete-trial instruction</article-title>
          <source>J Appl Behav Anal</source>
          <year>2015</year>
          <volume>48</volume>
          <issue>2</issue>
          <fpage>257</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1002/jaba.205</pub-id>
          <pub-id pub-id-type="medline">25913105</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <article-title>Google Natural Language AI</article-title>
          <source>Google</source>
          <year>2022</year>
          <access-date>2022-09-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://cloud.google.com/natural-language">https://cloud.google.com/natural-language</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kazemi</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A review of training strategies to teach individuals implementation of behavioral interventions</article-title>
          <source>J Organ Behav Manag</source>
          <year>2017</year>
          <month>02</month>
          <day>14</day>
          <volume>37</volume>
          <issue>1</issue>
          <fpage>32</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1080/01608061.2016.1267066</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hattie</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Timperley</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The power of feedback</article-title>
          <source>Rev Educ Res</source>
          <year>2007</year>
          <month>3</month>
          <volume>77</volume>
          <issue>1</issue>
          <fpage>81</fpage>
          <lpage>112</lpage>
          <pub-id pub-id-type="doi">10.3102/003465430298487</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fritz</surname>
              <given-names>CO</given-names>
            </name>
            <name name-style="western">
              <surname>Morris</surname>
              <given-names>PE</given-names>
            </name>
            <name name-style="western">
              <surname>Richler</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Effect size estimates: current use, calculations, and interpretation</article-title>
          <source>J Exp Psychol Gen</source>
          <year>2012</year>
          <month>02</month>
          <volume>141</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1037/a0024338</pub-id>
          <pub-id pub-id-type="medline">21823805</pub-id>
          <pub-id pub-id-type="pii">2011-16756-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conroy</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>What hypotheses do “nonparametric” two-group tests actually test?</article-title>
          <source>Stata J</source>
          <year>2012</year>
          <month>06</month>
          <day>01</day>
          <volume>12</volume>
          <issue>2</issue>
          <fpage>182</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1177/1536867x1201200202</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Statistical power analysis</article-title>
          <source>Curr Dir Psychol Sci</source>
          <year>1992</year>
          <month>06</month>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>98</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.1111/1467-8721.ep10768783</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benjamini</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hochberg</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Controlling the false discovery rate: a practical and powerful approach to multiple testing</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>1995</year>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>289</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blanca</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Alarcón</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Arnau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bono</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bendayan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Non-normal data: is ANOVA still a valid option?</article-title>
          <source>Psicothema</source>
          <year>2017</year>
          <month>11</month>
          <volume>29</volume>
          <issue>4</issue>
          <fpage>552</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.7334/psicothema2016.383</pub-id>
          <pub-id pub-id-type="medline">29048317</pub-id>
          <pub-id pub-id-type="pii">4434</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blanca</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Alarcón</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Arnau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bono</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bendayan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Effect of variance ratio on ANOVA robustness: might 1.5 be the limit?</article-title>
          <source>Behav Res Methods</source>
          <year>2018</year>
          <month>06</month>
          <volume>50</volume>
          <issue>3</issue>
          <fpage>937</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.3758/s13428-017-0918-2</pub-id>
          <pub-id pub-id-type="medline">28643157</pub-id>
          <pub-id pub-id-type="pii">10.3758/s13428-017-0918-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>A meta-analysis of the effect of virtual reality technology use in education</article-title>
          <source>Interact Learn Environ (forthcoming)</source>
          <year>2021</year>
          <month>10</month>
          <day>20</day>
          <fpage>1</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1080/10494820.2021.1989466</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>González</surname>
              <given-names>VA</given-names>
            </name>
            <name name-style="western">
              <surname>Amor</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lovreglio</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Cabrera-Guerrero</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Immersive virtual reality serious games for evacuation training and research: a systematic literature review</article-title>
          <source>Comput Educ</source>
          <year>2018</year>
          <month>12</month>
          <volume>127</volume>
          <fpage>252</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1016/j.compedu.2018.09.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sveinbjörnsdóttir</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jóhannsson</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Oddsdóttir</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sigurðardóttir</surname>
              <given-names>TÞ</given-names>
            </name>
            <name name-style="western">
              <surname>Valdimarsson</surname>
              <given-names>GI</given-names>
            </name>
            <name name-style="western">
              <surname>Vilhjálmsson</surname>
              <given-names>HH</given-names>
            </name>
          </person-group>
          <article-title>Virtual discrete trial training for teacher trainees</article-title>
          <source>J Multimodal User Interfaces</source>
          <year>2019</year>
          <month>1</month>
          <day>2</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>31</fpage>
          <lpage>40</lpage>
          <pub-id pub-id-type="doi">10.1007/s12193-018-0288-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ericsson</surname>
              <given-names>KA</given-names>
            </name>
          </person-group>
          <article-title>Deliberate practice and the acquisition and maintenance of expert performance in medicine and related domains</article-title>
          <source>Acad Med</source>
          <year>2004</year>
          <month>10</month>
          <volume>79</volume>
          <issue>10 Suppl</issue>
          <fpage>S70</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1097/00001888-200410001-00022</pub-id>
          <pub-id pub-id-type="medline">15383395</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Catagnus</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Brandt</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Can behavior analysis help us understand and reduce racism? A review of the current literature</article-title>
          <source>Behav Anal Pract</source>
          <year>2020</year>
          <month>06</month>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>336</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32642393"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40617-020-00411-4</pub-id>
          <pub-id pub-id-type="medline">32642393</pub-id>
          <pub-id pub-id-type="pii">411</pub-id>
          <pub-id pub-id-type="pmcid">PMC7314880</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
