<?xml version="1.0" encoding="UTF-8"?><?xml-model type="application/xml-dtd" href="http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1d3 20150301//EN" "http://jats.nlm.nih.gov/publishing/1.1d3/JATS-journalpublishing1.dtd">
<article xmlns:ali="http://www.niso.org/schemas/ali/1.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" dtd-version="1.1d3" specific-use="Marcalyc 1.2" article-type="research-article" xml:lang="en">
<front>
<journal-meta>
<journal-id journal-id-type="redalyc">3442</journal-id>
<journal-title-group>
<journal-title specific-use="original" xml:lang="es">TecnoLógicas</journal-title>
</journal-title-group>
<issn pub-type="ppub">0123-7799</issn>
<issn pub-type="epub">2256-5337</issn>
<publisher>
<publisher-name>Instituto Tecnológico Metropolitano</publisher-name>
<publisher-loc>
<country>Colombia</country>
<email>tecnologicas@itm.edu.co</email>
</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="art-access-id" specific-use="redalyc">344262603026</article-id>
<article-id pub-id-type="doi">https://doi.org/10.22430/22565337.1475</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artículos de investigación</subject>
</subj-group>
</article-categories>
<title-group>
<article-title xml:lang="en">Identity Verification in Virtual Education Using Biometric Analysis Based on Keystroke Dynamics</article-title>
<trans-title-group>
<trans-title xml:lang="es">Verificación de identidad en la educación virtual mediante análisis biométrico basado en la dinámica del tecleo</trans-title>
</trans-title-group>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-3257-0134</contrib-id>
<name name-style="western">
<surname>Escobar-Grisales</surname>
<given-names>Daniel.</given-names>
</name>
<xref ref-type="aff" rid="aff1"/>
<email>daniel.esobar@udea.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0003-4946-9232</contrib-id>
<name name-style="western">
<surname>Vásquez-Correa</surname>
<given-names>Juan. C.</given-names>
</name>
<xref ref-type="aff" rid="aff2"/>
<email>jcamilo.vasquez@udea.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0001-8794-6429</contrib-id>
<name name-style="western">
<surname>Vargas-Bonilla</surname>
<given-names>Jesús F.</given-names>
</name>
<xref ref-type="aff" rid="aff3"/>
<email>jesus.vargas@udea.edu.co</email>
</contrib>
<contrib contrib-type="author" corresp="no">
<contrib-id contrib-id-type="orcid">http://orcid.org/0000-0002-8507-0782</contrib-id>
<name name-style="western">
<surname>Orozco-Arroyave</surname>
<given-names>Juan Rafael</given-names>
</name>
<xref ref-type="aff" rid="aff4"/>
<email>rafael.orozco@udea.edu.co</email>
</contrib>
</contrib-group>
<aff id="aff1">
<institution content-type="original">MSc. in Electronics and Telecomunications Engineering, Faculty of Engineering. Universidad de Antioquia, Medellín-Colombia, daniel.esobar@udea.edu.co</institution>
<institution content-type="orgname">Universidad de Antioquia</institution>
<country country="CO">Colombia</country>
</aff>
<aff id="aff2">
<institution content-type="original">MSc. in Telecommunications engineering, Faculty of Engineering, Universidad de Antioquia, Medellín, Colombia; Pattern, Recognition Lab. Friedrih-Alexander-Universität, Erlangen-Nürnberg- Germany, Medellín-Colombia, jcamilo.vasquez@udea.edu.co</institution>
<institution content-type="orgname">Friedrich-Alexander-Universität</institution>
<country country="DE">Alemania</country>
</aff>
<aff id="aff3">
<institution content-type="original">PhD. in Cibernetcs and Telecommunications, Faculty of Engineering. Universidad de Antioquia, Medellín-Colombia, jesus.vargas@udea.edu.co</institution>
<institution content-type="orgname">Universidad de Antioquia</institution>
<country country="CO">Colombia</country>
</aff>
<aff id="aff4">
<institution content-type="original">PhD. in Computer Science, Faculty of Engineering, Universidad de Antioquia, Medellín, Colombia; Pattern Recognition Lab. Friedrih-Alexander-Universität, Erlangen-Nürnberg- Germany, Medellín-Colombia, rafael.orozco@udea.edu.co</institution>
<institution content-type="orgname">Friedrich-Alexander-Universität</institution>
<country country="DE">Alemania</country>
</aff>
<pub-date pub-type="epub-ppub">
<season>Enero-Abril</season>
<year>2020</year>
</pub-date>
<volume>23</volume>
<issue>47</issue>
<fpage>197</fpage>
<lpage>211</lpage>
<history>
<date date-type="received" publication-format="dd mes yyyy">
<day>13</day>
<month>09</month>
<year>2019</year>
</date>
<date date-type="accepted" publication-format="dd mes yyyy">
<day>05</day>
<month>12</month>
<year>2019</year>
</date>
</history>
<permissions>
<copyright-year>2020</copyright-year>
<copyright-holder>Instituto Tecnológico Metropolitano</copyright-holder>
<ali:free_to_read/>
<license xlink:href="https://creativecommons.org/licenses/by-nc-sa/4.0/">
<ali:license_ref>https://creativecommons.org/licenses/by-nc-sa/4.0/</ali:license_ref>
<license-p>Esta obra está bajo una Licencia Creative Commons Atribución-NoComercial-CompartirIgual 4.0 Internacional.</license-p>
</license>
</permissions>
<self-uri content-type="html" xlink:href="https://revistas.itm.edu.co/index.php/tecnologicas/article/view/1475">https://revistas.itm.edu.co/index.php/tecnologicas/article/view/1475</self-uri>
<abstract xml:lang="en">
<title>Abstract</title>
<p>Virtual education has become one of the tools most widely used by students at all educational levels, not just because of its convenience and flexibility, but also because it can expand educational coverage. All these benefits also bring along multiple issues in terms of security and reliability in the evaluation of the student’s knowledge because traditional identity verification strategies, such as the combination of username and password, do not guarantee that the student enrolled in the course really takes the exam. Therefore, a system with a different type of verification strategy should be designed to differentiate valid users from impostors. This study proposes a new verification system based on distances computed among Gaussian Mixture Models created with different writing tasks. The proposed approach is evaluated in two different modalities, namely intrusive verification and non-intrusive verification. The intrusive mode provides a false positive rate of around 16 %, while the non-intrusive mode provides a false positive rate of 12 %. In addition, the proposed strategy for non-intrusive verification is compared to a work previously reported in the literature and the results show that our approach reduces the equal error rate by about 24.3 %. The implemented strategy does not need additional hardware; only the computer keyboard is required to complete the user verification, which makes the system attractive, flexible, and practical for virtual education platforms.</p>
</abstract>
<trans-abstract xml:lang="es">
<title>Resumen</title>
<p>La educación virtual se ha convertido en una de las herramientas más utilizadas por los estudiantes en todos los niveles educativos, no solo por la comodidad y la flexibilidad, sino también por la posibilidad de ampliar la cobertura educativa en una población. Todos estos beneficios traen consigo múltiples problemas de seguridad y confiabilidad a la hora de evaluar el proceso de aprendizaje del estudiante, ya que las estrategias tradicionales de verificación de identidad, como la combinación de nombre de usuario y contraseña, no garantizan que el estudiante matriculado en el curso realmente realice el examen. Por lo tanto, es necesario diseñar un sistema con otro tipo de estrategia de verificación para diferenciar un usuario válido de un impostor. Este estudio propone un nuevo método de verificación, basado en el cálculo de distancias entre los modelos de mezclas gaussianas creados con diferentes tareas de escritura. El enfoque propuesto es evaluado en dos modalidades diferentes llamadas verificación intrusiva y verificación no intrusiva. El modo intrusivo proporciona una tasa de falsos positivos de 16 %, mientras el modo no intrusivo provee una tasa de falsos positivos de 12 %. Además, la estrategia propuesta para verificación no intrusiva es comparada con un trabajo previamente reportado en la literatura y los resultados muestran que nuestro enfoque reduce la tasa de error en aproximadamente un 24.3 %. La estrategia implementada no necesita hardware adicional, solo es requerido el teclado del computador para realizar la verificación, lo que hace que el sistema sea atractivo y flexible para ser usado en plataformas de educación virtual.</p>
</trans-abstract>
<kwd-group xml:lang="en">
<title>Keywords</title>
<kwd>Biometrics</kwd>
<kwd>Identity verification</kwd>
<kwd>Keystroke dynamics</kwd>
<kwd>Virtual Education</kwd>
</kwd-group>
<kwd-group xml:lang="es">
<title>Palabras clave</title>
<kwd>Biometría</kwd>
<kwd>dinámica de tecleo</kwd>
<kwd>educación virtual</kwd>
<kwd>verificación de identidad</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="5"/>
<equation-count count="5"/>
<ref-count count="19"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>Cómo citar / How to cite</meta-name>
<meta-value>D. Escobar-Grisales, J. C. Vásquez-Correa, J. F. Vargas-Bonilla, J. R. Orozco-Arroyave, “Identity verification in virtual education using biometric analysis based on keystroke dynamics”, <italic>TecnoLógicas,</italic> vol. 23, no. 47, pp. 197-211, 2020. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.22430/22565337.1475">https://doi.org/10.22430/22565337.1475</ext-link>
</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec>
<title>
<bold>1. INTRODUCTION</bold>
</title>
<p>Virtual Education (VE) offers multiple benefits, not only because of its convenience and flexibility for students and teachers, but also because it can improve educational coverage, especially in remote areas with limited access to resources. Nevertheless, the quality of virtual education is controversial although, according to the U.S. Department of Education <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref1">1</xref>]</sup>, online students achieve a better performance than those who take face-to-face classes. Furthermore, online students tend to be self-motivated, self-disciplined, and self-directed, which makes VE a very popular modality nowadays.</p>
<p>The freedom students experience in VE also produces security and reliability issues, especially when giving tests and exams. According to Bretag <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref2">2</xref>]</sup>, fraud in VE is higher and more worrying than in traditional education. For instance, 95 % of the students in Israel and 69 % in Korea admitted to committing fraud in virtual exams or tests and the trend is similar in the rest of the world <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref2">2</xref>]</sup>. For this reason, virtual tests are not used in evaluations such as admission exams or final tests by universities.</p>
<p>In general terms, biometric systems can be classified into two approaches: verification and identification <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref3">3</xref>]</sup>. In identification, the biometric features of a user are compared to multiple users in a database in order to find the identity of the user among all the individuals. In verification, a previously registered user logs-in to the system and the biometric features of the user are compared with the biometric features of the register.</p>
<p>Depending on the similarity of the features, the system may decide whether the user is valid or not.</p>
<p>Keystroke Dynamics (KD) analysis is a very good option to capture biometric information to control who has access to certain information or platforms. One of the main advantages of KD is that it does not require the use of additional hardware, i.e., the identity of a user can be verified with a regular computer keyboard.</p>
<p>KD analysis started in the 20th century when telegraph operators had to transmit dozens of words in a short period of time, developing a distinctive rhythm that was captured by the operators on the other side of the line to identify who was transmitting <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref4">4</xref>]</sup>. Later, in 1990, Joyce and Gupta <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref5">5</xref>]</sup> extracted specific digital signatures to identify users based on their KD.</p>
<p>The authors asked users to type their username and password 8 times to compute a curve with the average time they took to enter the data. At a later login, the system compared the average curve with the new curve generated in the new login. Then, the system detected whether the user was valid or an impostor based on a measure of similarity between the two curves. The system was evaluated with 30 valid users and 27 impostors.</p>
<p>As a result, there was a total of 30 valid access attempts and 810 intruder access attempts. The authors reported a False Positive Rate (FPR) of 0.25 % and a False Negative Rate (FNR) of 16.0 %. The system had several usability issues since the user was requested to type the data correctly.</p>
<p>The system was biased by cases where a user deleted wrong characters. A similar strategy was proposed in <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref6">6</xref>]</sup> to identify 173 users based on their KD. The users attended a programming course at the Helsinki University, and the data were extracted based on their programming exercises. The authors created a student profile based on the average hold time when pressing any key, the average hold time when pressing a particular key, the average time when pressing two particular keys, and a combination of the three previous times. The similarity between the evaluation sample and the database was measured with the Euclidean distance.</p>
<p>The authors reported accuracies of up to 97 %. In <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref7">7</xref>]</sup>, the authors proposed a model to verify user identity with features extracted when users typed a password on a smartphone. The authors asked 94 different users to type the password “.tieRoanl” in order to extract features such as pressure when touching the screen, coordinates of the pressing point, and times when the finger presses or releases the screen. The authors computed several statistical functionals from the keystrokes and obtained a set of 155 features. The most important features were selected based on a minimum Redundancy Maximum Relevance (mRMR) algorithm. The selected features included pressure and coordinates. The authors reported an accuracy of 97.4 % using a Support Vector Machine (SVM) classifier. In recent years, identity verification based on KD has captured the attention of the research community. For instance, a keystroke dynamic application was presented in <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref8">8</xref>]</sup>. In the study, the authors created a keyprint (typing fingerprints) to authenticate users in online courses.  The aim of a keyprint is to capture few data with specific characteristics of a user’s KD; therefore, only data with unusual values of typing dynamics are considered. The authors claim that this system is suitable for verification but not for identification.</p>
<p>They also showed that two samples from the same user are very unlikely to be exactly the same; therefore, to determine the similarity between the samples, a 𝑡-test (𝛼 = 0.05) is enough. The decision is made based on the equal error rate (EER), i.e., where FPR and FNR are the same. The authors reported an accuracy of 80 %, but the main drawback of the approach was that users needed to type at least 964 characters to be correctly identified.</p>
<p>A strategy to authenticate a user identity based on KD is proposed in <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref9">9</xref>]</sup>, where the identity of the users is verified by comparing enrollment and log-in information. A total of 63 users were asked to type 5 items of personal information: name, last name, email address, nationality, and national ID.</p>
<p>The database comprised 12 genuine accesses and 12 impostor accesses per user to enroll, for a total of 7560 samples. Six genuine samples were used to register the user; and the rest, to log in. The authors tested different features, but the best result was obtained using the time between key press and release and the difference between the time of pressing a key and releasing the following one. With these features and a classifier based on the Modified Scaled Manhattan distance, they obtained an EER of 2.4 %. In <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref9">9</xref>]</sup>, this result was achieved because the identity of users was verified using KD when they typed data such as name, email address, and other information. As users are familiar with these data, the KD will probably not vary from one sample to the next, which allows systems to verify users’ identity in a more accurate way.</p>
<sec>
<title>
<bold>1.1 Contribution of this study</bold>
</title>
<p>This paper proposes a methodology to verify the identity of students based on their KD. The proposed approach is tested on two different modalities: intrusive and non-intrusive. The first mode considers the case when the subject is aware of being tested, and the second mode considers the case where the subject is not aware of the verification process, and then a different writing task is required to verify the identity of the subject.</p>
<p>The features extracted from the writing tasks are used to create Gaussian Mixture Models (GMM). Those models are compared using probabilistic distances to make the decision whether a user is valid or not. The main difference of the proposed method with respect to others reported in the literature is that our approach is based on probabilistic models instead of the direct comparison of feature sets. The results indicate that it is possible to detect intruders with accuracies of up to 89 %, measured in the EER.</p>
</sec>
</sec>
<sec>
<title>
<bold>2. MATERIALS AND METHODS</bold>
</title>
<sec>
<title>
<bold>2.1 Participants</bold>
</title>
<p>A total of 170 subjects (116 male) participated in this study. The average age was 24 years old. The subjects were asked to perform 5 different tasks which were designed to capture the KD over different regions of the keyboard. Most users were undergraduate students from the University of Antioquia. Users with higher education attainment were also considered.</p>
<p>In addition, 20 of the 170 users performed different tasks in two different sessions. (<xref ref-type="table" rid="gt1">Table 1</xref>) details participants’ information.</p>
<p>
<table-wrap id="gt1">
<label>Table 1</label>
<caption>
<title>Demographic information of the participants in this study</title>
</caption>
<alt-text>Table 1 Demographic information of the participants in this study</alt-text>
<alternatives>
<graphic xlink:href="344262603026_gt2.png" position="anchor" orientation="portrait"/>
<table style="width:  208.2pt;border-collapse:collapse;border:none;  " id="gt2-526564616c7963">
<tbody>
<tr style="height:14.2pt">
<td style="width:77.75pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt"/>
<td style="width:71.85pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">Male</td>
<td style="width:58.6pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">Female</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">Subjects</td>
<td style="width:71.85pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">116</td>
<td style="width:58.6pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">54</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">Age (µ ± σ)</td>
<td style="width:71.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">23 ± 5.8</td>
<td style="width:58.6pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">24 ± 7.1</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">Students</td>
<td style="width:71.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">102</td>
<td style="width:58.6pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">44</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">Graduate</td>
<td style="width:71.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">6</td>
<td style="width:58.6pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">7</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">MSc</td>
<td style="width:71.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">4</td>
<td style="width:58.6pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.2pt">-</td>
</tr>
<tr style="height:14.2pt">
<td style="width:77.75pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">PhD</td>
<td style="width:71.85pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">4</td>
<td style="width:58.6pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.2pt">3</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
</sec>
<sec>
<title>
<bold>2.2 Data collection</bold>
</title>
<p>Each user of the database performed 5 different tasks. The first 4 tasks were designed to capture specific movements on the keyboard. For instance, task 1 captures long horizontal displacements. In this task, the user typed the sentence “<italic>El sapo de mi casa come queso, zapallo y xoubas</italic>”. Here, the characters of each word follow other characters on the opposite side of the keyboard; thus, it is possible to define the user’s dynamics while moving from one side to the other. (<xref ref-type="fig" rid="gf1">Fig. 1a</xref>) shows the keyboard regions involved in this task.</p>
<p>
<fig id="gf1">
<label>Fig. 1.</label>
<caption>
<title>(a) Task 1, long displacement on the horizontal axis; (b) Task 2, short displacement on the horizontal axis; (c) Task 3, top displacement on the vertical axis; and (d) Task 4, lower displacement on the vertical axis.</title>
</caption>
<alt-text>Fig. 1. (a) Task 1, long displacement on the horizontal axis; (b) Task 2, short displacement on the horizontal axis; (c) Task 3, top displacement on the vertical axis; and (d) Task 4, lower displacement on the vertical axis.</alt-text>
<graphic xlink:href="344262603026_gf2.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<p>The arrow indicates displacements between the two regions. Similarly, task 2, “<italic>En un pueblo un niño juega afuera y tu vejez es notable</italic>”, aims to capture short displacements along the horizontal axis. These displacements are shown in (<xref ref-type="fig" rid="gf1">Fig. 1b</xref>). Task 3, “<italic>La leña esta partida, la tijera se ha roto, yo quiero jugar y reír, dale a la gata sus gatitos y las fresas y las patatas del huerto</italic>”, connects characters in the middle row of the keyboard with some in the top row, defining top vertical displacements. This task is shown in (<xref ref-type="fig" rid="gf1">Fig. 1c</xref>).</p>
<p>Finally, task 4, “<italic>La vaca flaca, las lañas malvas, las jacas blancas, a la sal acabas la salsa, zancada flaca</italic>”, requires the user to connect characters in the middle row with characters in the bottom row, defining the lower vertical displacements, as shown in (<xref ref-type="fig" rid="gf1">Fig. 1d</xref>). To define users’ KD in normal conditions, we considered task 5, which has a total of 500 characters. This task was extracted from the novel <italic>Frankenstein or the modern Prometheus</italic> by Mary Shelley <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref10">10</xref>]</sup>. (<xref ref-type="table" rid="gt2">Table 2</xref>) details the size of each task.</p>
<p>
<table-wrap id="gt2">
<label>Table 2</label>
<caption>
<title>Length of each task</title>
</caption>
<alt-text>Table 2 Length of each task</alt-text>
<alternatives>
<graphic xlink:href="344262603026_gt3.png" position="anchor" orientation="portrait"/>
<table style="border-collapse:collapse;border:none;  " id="gt3-526564616c7963">
<tbody>
<tr style="height:14.4pt">
<td style="width:50.85pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">Tasks</td>
<td style="width:76.45pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">Character count</td>
<td style="width:71.2pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">Word count</td>
</tr>
<tr style="height:14.4pt">
<td style="width:50.85pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">1</td>
<td style="width:76.45pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">54</td>
<td style="width:71.2pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">11</td>
</tr>
<tr style="height:14.4pt">
<td style="width:50.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">2</td>
<td style="width:76.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">56</td>
<td style="width:71.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">12</td>
</tr>
<tr style="height:14.4pt">
<td style="width:50.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">3</td>
<td style="width:76.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">133</td>
<td style="width:71.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">28</td>
</tr>
<tr style="height:14.4pt">
<td style="width:50.85pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">4</td>
<td style="width:76.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">92</td>
<td style="width:71.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:14.4pt">17</td>
</tr>
<tr style="height:14.4pt">
<td style="width:50.85pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">5</td>
<td style="width:76.45pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">518</td>
<td style="width:71.2pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:14.4pt">90</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
</sec>
<sec>
<title>
<bold>2.3 Methods</bold>
</title>
<p>A user registers in the platform by typing the first 4 tasks previously described in (<xref ref-type="fig" rid="gf1">Fig. 1</xref>). When the user types, the system returns data from the KD. The user-model is created with the KD data. When the user logs into the platform, s/he should type one of the 5 tasks following a procedure similar to the one completed during the registration stage. A login model is created per user and compared to the model created during the registration stage. Finally, if the distance between these two models is short, the user is classified as valid; otherwise, the user is classified as an intruder. The general methodology is summarized in (<xref ref-type="fig" rid="gf2">Fig. 2</xref>). The next subsections detail the methods applied at each stage of the methodology.</p>
<p>
<fig id="gf2">
<label>Fig. 2.</label>
<caption>
<title>General methodology implemented in this study. The upper part of the methodology shows the registration stage; and the lower part, the log-in stage.</title>
</caption>
<alt-text>Fig. 2.  General methodology implemented in this study. The upper part of the methodology shows the registration stage; and the lower part, the log-in stage.</alt-text>
<graphic xlink:href="344262603026_gf3.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
</sec>
<sec>
<title>
<bold>2.4 Raw information extracted from the computer to model KD</bold>
</title>
<p>Computers can provide the ASCII code of the characters that are typed when a text is written. They can also store the time the keys were pressed (P) and released (R). (<xref ref-type="table" rid="gt3">Table 3</xref>) shows an example with the raw information that can be extracted when the word “Hola” is typed.</p>
<p>
<table-wrap id="gt3">
<label>Table 3</label>
<caption>
<title>Example of data captured by the platform. Word: “Hola”; P: press; R: release</title>
</caption>
<alt-text>Table 3 Example of data captured by the platform. Word: “Hola”; P: press; R: release</alt-text>
<alternatives>
<graphic xlink:href="344262603026_gt4.png" position="anchor" orientation="portrait"/>
<table style="width:  389.95pt;border-collapse:collapse;border:none;  " id="gt4-526564616c7963">
<tbody>
<tr style="height:15.1pt">
<td style="width:80.25pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">Key</td>
<td style="width:78.75pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">Code</td>
<td style="width:118.45pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">Operation</td>
<td style="width:112.5pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">Time(ms)</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">H</td>
<td style="width:78.75pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">72</td>
<td style="width:118.45pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">P</td>
<td style="width:112.5pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">3301</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">O</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">111</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">P</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3524</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">H</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">72</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">R</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3556</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">O</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">111</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">R</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3612</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">L</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">108</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">P</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3644</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">L</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">108</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">R</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3692</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">A</td>
<td style="width:78.75pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">97</td>
<td style="width:118.45pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">P</td>
<td style="width:112.5pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:15.1pt">3716</td>
</tr>
<tr style="height:15.1pt">
<td style="width:80.25pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">A</td>
<td style="width:78.75pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">97</td>
<td style="width:118.45pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">R</td>
<td style="width:112.5pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:15.1pt">3820</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
<p>
<bold>Table 3.</bold> Example of data captured by the platform. Word = “hola”; P: press, R: release.</p>
</sec>
<sec>
<title>
<bold>2.5 User Characterization</bold>
</title>
<p>The objective of this stage is to find a feature matrix 𝑋 ∈ ℝ<sup>𝑛,𝑘</sup> associated with each user, where 𝑛 refers to the number of segments and 𝑘 is the number of extracted features. <xref ref-type="fig" rid="gf3">Fig. 3</xref> describes the feature matrix 𝑋. Note that each task might have a different number of segments (rows), but the number of features is fixed. The characterization process is divided into two parts: segmentation and feature extraction.</p>
<p>
<fig id="gf3">
<label>Fig. 3.</label>
<caption>
<title>Feature matrix 𝑋 of each user.</title>
</caption>
<alt-text>Fig. 3. Feature matrix 𝑋 of each user.</alt-text>
<graphic xlink:href="344262603026_gf4.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<sec>
<title>
<bold>2.5.1. Segmentation</bold>
</title>
<p>Each row in 𝑋 refers to a specific segment of the text that the user has typed. These segments were based on a tri-graph model, which consists of small packets with the information of three consecutive characters. A similar strategy was considered in another study for identity verification based on speech signals <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref11">11</xref>]</sup>.</p>
<p>For our analysis a sliding window of 5 tri-graphs, with an overlap of 3 tri-graphs, was used, as shown in (<xref ref-type="fig" rid="gf4">Fig. 4</xref>).</p>
<p>
<fig id="gf4">
<label>Fig. 4.</label>
<caption>
<title>Segmentation of the sentence: “El sapo de mi casa co”. Trigraphs (blue), segment 1 (green), and segment 2 (dotted line).</title>
</caption>
<alt-text>Fig. 4. Segmentation of the sentence: “El sapo de mi casa co”. Trigraphs (blue), segment 1 (green), and segment 2 (dotted line).</alt-text>
<graphic xlink:href="344262603026_gf5.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
</sec>
<sec>
<title>
<bold>2.5.2 Feature extraction</bold>
</title>
<p>A total of six time series are created when the user types each character: three when the key is pressed and three when the key is released. These times are shown in Table 3. With this information, it is possible to extract two main features: <bold>Hold time</bold>, which is the time between press and release of a key; and <bold>Flight time</bold>, which is the time between pressing a key and pressing the next one, as described in (<xref ref-type="fig" rid="gf9">Fig. 5</xref>). The thirteen features that are extracted per segment are described below:</p>
<p>
<fig id="gf9">
<label>Fig. 5.</label>
<caption>
<title>Hold Time: time between press and release of a key. Flight Time: time between pressing a key and pressing the next one.</title>
</caption>
<alt-text>Fig. 5. Hold Time: time between press and release of a key. Flight Time: time between pressing a key and pressing the next one.</alt-text>
<graphic xlink:href="344262603026_gf6.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<p>· Total Hold Time (𝑇<sub>𝐻𝑇</sub>): the sum of the hold times of the characters.</p>
<p>· Average Hold Time (𝐴<sub>𝐻𝑇</sub>): the sum of the hold times of the characters divided by the number of characters.</p>
<p>· Standard Deviation of the Hold Time (𝜎<sub>𝐻𝑇</sub>): the deviation of the Hold times with respect to 𝐴<sub>𝐻𝑇</sub>.</p>
<p>· Strong Key (𝑆<sub>𝐾</sub>): the code of the key with the shortest hold time.</p>
<p>· Time Strong Key (𝑇<sub>𝑆𝐾</sub>): the minimum hold time.</p>
<p>· Weak Key (𝑊<sub>𝐾</sub>): the code of the key with the longest hold time.</p>
<p>· Time Weak Key (𝑇<sub>𝑊𝐾</sub>): the maximum hold time.</p>
<p>· Total Flight Time (𝑇<sub>𝐹𝑇</sub>): the sum of flight times of the characters.</p>
<p>· Average Flight Time (𝐴<sub>𝐹𝑇</sub>): the sum of the Flight times of the characters divided by the number of characters.</p>
<p>· Standard Deviation of the Flight Time (𝜎<sub>𝐹𝑇</sub>): the deviation of the Flight times with respect to 𝐴<sub>𝐹𝑇</sub>.</p>
<p>· Strong Key in Flight (𝑆<sub>𝐾𝐹</sub>): the code of the key with the shortest flight time.</p>
<p>· Time Strong Key in Flight (𝑇<sub>𝑆𝐾𝐹</sub>): the minimum flight time.</p>
<p>· Weak Key in Flight (𝑊<sub>𝐾𝐹</sub>): the code of the key with the longest flight time.</p>
<p>· Time Weak Key in Flight (𝑇<sub>𝑊𝐾𝐹</sub>): the maximum flight time.</p>
<p>Once the feature matrix has been created per user, it is necessary to find a representation to model the distribution of the features. The models created in the registration stage are compared with those created in the log-in stage. We considered Gaussian Mixture Models (GMM) to create those models and the Bhattacharyya distance to compare them, as explained below.</p>
</sec>
</sec>
<sec>
<title>
<bold>2.6  Gaussian Mixture Model</bold>
</title>
<p>A GMM is a probabilistic model created to represent a population from a linear combination of Gaussian distributions.</p>
<p>Each Gaussian of the GMM models a specific group of samples in a population <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref12">12</xref>], [<xref ref-type="bibr" rid="redalyc_344262603026_ref13">13</xref>]</sup>. Equation (<xref ref-type="disp-formula" rid="e1">1</xref>) shows the mathematical expression for a GMM of a multivariate random variable 𝒙, which corresponds to the sum of 𝑀 Gaussian distributions, weighted by a parameter 𝐶<sub>𝑚</sub>.</p>
<p>
<disp-formula id="e1">
<label>(1)</label>
<graphic xlink:href="344262603026_ee2.png" position="anchor" orientation="portrait"/>
</disp-formula>
</p>
<p>A compact way to represent GMM models is indicated in (<xref ref-type="disp-formula" rid="e2">2</xref>).</p>
<p>
<disp-formula id="e2">
<label>(2)</label>
<graphic xlink:href="344262603026_ee3.png" position="anchor" orientation="portrait"/>
</disp-formula>
</p>
<p>Three parameters should be estimated in the GMM modeling approach: weight 𝐶<sub>𝑚</sub>, mean vector 𝝁<sub>𝑚</sub>, and covariance matrix 𝜮<bold>
<sub>𝑚</sub>
</bold>. 𝑚 is the index for the Gaussians. These parameters are estimated using the Expectation–Maximization (EM) algorithm. The total number of Gaussians 𝑀 must be defined before starting the estimation procedure, and it can be done according to the Bayesian Information Criterion (BIC) <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref14">14</xref>]</sup>, which measures the quantity of information lost when the model is used.</p>
<p>However, in case of problems where there is no prior knowledge of the data, the number of Gaussian distributions is found experimentally <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref11">11</xref>]</sup>.</p>
</sec>
<sec>
<title>
<bold>2.7 Classification</bold>
</title>
<p>Each user is represented by a GMM.</p>
<p>Thus, to calculate the similarity between two models (registration: 𝑓<sub>𝑖</sub>(𝑥) and log-in: 𝑔<sub>𝑖</sub>(𝑥)), we can use the Bhattacharyya distance (𝐷<sub>𝐵ℎ𝑎</sub>), where 𝝁<sub>𝑚</sub> and the 𝜮<bold>
<sub>𝑚</sub>
</bold> of each GMM are taken into account <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref15">15</xref>]</sup>.</p>
<p>𝐷<sub>𝐵ℎ𝑎</sub> can be expressed as in (<xref ref-type="disp-formula" rid="e3">3</xref>):</p>
<p>
<disp-formula id="e3">
<label>(3)</label>
<graphic xlink:href="344262603026_ee4.png" position="anchor" orientation="portrait"/>
</disp-formula>
</p>
<p>where the first term considers the mean vectors of the GMMs, and the second term is the covariance matrix. As indicated in Equation (<xref ref-type="disp-formula" rid="e3">3</xref>), the similarity measurement between the two models, 𝑓<sub>𝑖</sub>(𝑥) and 𝑔<sub>𝑖</sub>(𝑥), considers the mean vectors and the covariance matrix separately. Mean vectors are compared in (<xref ref-type="disp-formula" rid="e4">4</xref>), while the covariance matrix is considered in (<xref ref-type="disp-formula" rid="e5">5</xref>).</p>
<p>
<disp-formula id="e4">
<label>(4)</label>
<graphic xlink:href="344262603026_ee5.png" position="anchor" orientation="portrait"/>
</disp-formula>
</p>
<p>
<disp-formula id="e5">
<label>(5)</label>
<graphic xlink:href="344262603026_ee6.png" position="anchor" orientation="portrait"/>
</disp-formula>
</p>
<p>Finally, depending on the similarity of both models, it is possible to classify the user’s identity. If the user is valid, the distance between the two models is expected to be less than the distance resulting from an impostor. However, it is necessary to define a threshold 𝑈 to decide whether a user is valid or an impostor.</p>
<p>This distance measurement has been considered in previous studies where GMM models resulting from speech recordings are compared <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref16">16</xref>]</sup>.</p>
<p><xref ref-type="fig" rid="gf5">Fig. 6</xref> and <xref ref-type="fig" rid="gf6">Fig. 7</xref> show the flowcharts of the registration and login stages, respectively. The number of components 𝑀 and the decision threshold 𝑈 are found in the training and development stage explained below.</p>
<p>
<fig id="gf5">
<label>Fig. 6.</label>
<caption>
<title>Flowchart of the registration stage</title>
</caption>
<alt-text>Fig. 6. Flowchart of the registration stage</alt-text>
<graphic xlink:href="344262603026_gf7.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<p>
<fig id="gf6">
<label>Fig. 7.</label>
<caption>
<title>Flowchart of the login stage</title>
</caption>
<alt-text>Fig. 7.  Flowchart of the login stage</alt-text>
<graphic xlink:href="344262603026_gf8.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
</sec>
</sec>
<sec>
<title>
<bold>3. EXPERIMENTS AND RESULTS</bold>
</title>
<p>The test stage aims to evaluate the performance and usability of the system in two different modes: intrusive and non-intrusive verification. In the intrusive mode, the user is aware that his/her identity is being verified through the keyboard. On the other hand, in the non-intrusive mode the user does not know that he/she is being verified.</p>
<sec>
<title>
<bold>3.1 Experiment 1: intrusive mode</bold>
</title>
<p>In the intrusive mode, two sessions are required because the registration and log-in writing tasks are the same; thus, we use the first session to register and the second to log in the user. In this case, only 20 of the 170 users have two sessions; therefore, this experiment was conducted with 20 users.</p>
<p>For this experiment a cross validation strategy was carried out with 5 folds (Subject independent in each fold).</p>
<p>Therefore, 4 subjects were considered for the test and 16 were considered for the training. <xref ref-type="fig" rid="gf7">Fig. 8</xref> shows the test and training sets for each fold.</p>
<p>
<fig id="gf7">
<label>Fig. 8.</label>
<caption>
<title>EER when varying the decision threshold.</title>
</caption>
<alt-text>Fig. 8. EER when varying the decision threshold.</alt-text>
<graphic xlink:href="344262603026_gf9.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
<sec>
<title>
<bold>3.1.1 Training of the GMM-based model</bold>
</title>
<p>The training stage is considered to find the optimal hyper-parameters of the classifier that makes the decision. The number of Gaussian components (𝑀) was optimized following a grid search strategy between 1 and 50 in steps of 3 (using the minimum EER as the selection criterion).</p>
<p>The threshold 𝑈 was optimized between 0 and 1 in steps of 10<sup>-3</sup> (selection criterion also based on the EER).</p>
<p>These parameters are found for each fold. In each fold we consider the best M where the final EER was optimal. For this modality of intrusive verification, the optimal point is in 𝑀 = 34 ± 3.356 which is the median of the best M in each fold. The 𝑈 value was also varied from 0 to 1 for each 𝑀 and the average of the best thresholds along the folds is 𝑈 = 0.148 ± 0.006.</p>
</sec>
<sec>
<title>
<bold>3.1.2 Test of experiment 1</bold>
</title>
<p>The results of this experiment are shown in <xref ref-type="table" rid="gt9">Table 4</xref>. The performance is measured in terms of FPR and FNR. The usability of the method is measured in terms of the Cost to a User to Enroll (CUE) and the Cost to a User to Authenticate (CUA) <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref17">17</xref>]</sup>. These costs refer to the number of keys required to be pressed to do the registration or authentication procedure. The registration model is generated with the first 4 tasks; therefore, the CUE is 314 keystrokes.</p>
<p>
<table-wrap id="gt9">
<label>Table 4</label>
<caption>
<title>Performance and usability metrics when generating login models with known tasks</title>
</caption>
<alt-text>Table 4 Performance and usability metrics when generating login models with known tasks</alt-text>
<alternatives>
<graphic xlink:href="344262603026_gt5.png" position="anchor" orientation="portrait"/>
<table style="width:  333.15pt;border-collapse:collapse;" id="gt5-526564616c7963">
<tbody>
<tr style="height:20.6pt">
<td style="width:89.15pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">Log-in Tasks</td>
<td style="width:67.6pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">FPR (µ±σ)</td>
<td style="width:66.75pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">FNR (µ±σ)</td>
<td style="width:67.2pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">EER (µ±σ)</td>
<td style="width:42.45pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">CUA</td>
</tr>
<tr style="height:20.6pt">
<td style="width:89.15pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">
<bold>3</bold>
</td>
<td style="width:67.6pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">
<bold>11.8 ± 4.2</bold>
</td>
<td style="width:66.75pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">
<bold>19.5 ± 4.1</bold>
</td>
<td style="width:67.2pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">
<bold>15.7 ± 4.2</bold>
</td>
<td style="width:42.45pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">
<bold>133</bold>
</td>
</tr>
<tr style="height:20.6pt">
<td style="width:89.15pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">4</td>
<td style="width:67.6pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">10.3 ± 3.6</td>
<td style="width:66.75pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">22.5 ± 5.1</td>
<td style="width:67.2pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">16.4 ± 4.4</td>
<td style="width:42.45pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;height:20.6pt">91</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
<p>The log-in model is generated with Task 3 and Task 4, as indicated in Table 4. The minimum EER is obtained with Task 3; however, this is the task with the highest CUA. Task 1 and Task 2 do not have the minimum keystrokes required to perform their modeling with a GMM with 𝑀 = 34. A minimum of 2𝑀 + 1 keystrokes is needed in order to estimate the GMM’s covariances; therefore, these tasks were not included in the analysis.</p>
<p>
<bold>
<italic>3.2 Experiment 2: Non-intrusive mode</italic>
</bold>
</p>
<p>In this experiment, tasks 1, 2, 3 and 4 were used to generate the user registration model, in the same way as in the previous experiment. The difference with the previous experiment is that the login model is generated with task 5. Task 5 is divided into 5 equal-length chunks. For each chunk, the distance between the registration and log-in models is computed. To decide whether a user is valid or not, the average distance is estimated for the 5 chunks and compared to the decision threshold 𝑈.</p>
<p>For this experiment there are 170 different users. A cross validation strategy similar to that developed in the previous experiment was used. The only difference with respect to the previous experiment is that here we addressed a 10-fold cross validation strategy; thus, 153 subjects are used for the training stage and 17 subjects are used in the test stage (subject independent in each fold).</p>
</sec>
</sec>
<sec>
<title>
<bold>3.2.1 Training of the GMM-based model</bold>
</title>
<p>The strategy for the training of the GMM-based model in this experiment is the same as in the previous experiment. For this experiment the optimal hyper-parameters are: 𝑀 = 36 ± 6.074 and 𝑈 = 0.013 ± 0.021.</p>
</sec>
<sec>
<title>
<bold>3.2.2 Test of the experiment 2</bold>
</title>
<p>
<xref ref-type="table" rid="gt10">Table 5</xref> shows the performance and usability of the system by varying the number of chunks used to decide whether the user is valid or not. In this case the CUE is the same as the previous experiment, because the same tasks are used to create the registration model.</p>
<p>
<table-wrap id="gt10">
<label>Table 5</label>
<caption>
<title>Performance and usability metrics generating login models with unknown tasks by the register model using an average distance</title>
</caption>
<alt-text>Table 5 Performance and usability metrics generating login models with unknown tasks by the register model using an average distance</alt-text>
<alternatives>
<graphic xlink:href="344262603026_gt6.png" position="anchor" orientation="portrait"/>
<table style="width:  417.65pt;border-collapse:collapse;border:none;  " id="gt6-526564616c7963">
<tbody>
<tr style="height:16.1pt">
<td style="width:88.4pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">Used Chunks</td>
<td style="width:108.15pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">FPR (µ±σ)</td>
<td style="width:74.2pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">FNR (µ±σ)</td>
<td style="width:93.65pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">EER (µ±σ)</td>
<td style="width:53.25pt;border-top:solid windowtext 1.0pt;   border-left:none;border-bottom:solid windowtext 1.0pt;border-right:none;      padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">CUA</td>
</tr>
<tr style="height:16.1pt">
<td style="width:88.4pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">1</td>
<td style="width:108.15pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">13.5 ± 0.9</td>
<td style="width:74.2pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">13.6 ± 0.5</td>
<td style="width:93.65pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">13.6 ± 0.7</td>
<td style="width:53.25pt;border:none;   padding:0cm 5.4pt 0cm 5.4pt;height:16.1pt">104</td>
</tr>
<tr style="height:16.1pt">
<td style="width:88.4pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">2</td>
<td style="width:108.15pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">18.8 ± 0.7</td>
<td style="width:74.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">9.6 ± 0.4</td>
<td style="width:93.65pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">14.2 ± 0.6</td>
<td style="width:53.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">208</td>
</tr>
<tr style="height:16.1pt">
<td style="width:88.4pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">3</td>
<td style="width:108.15pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">12.9 ± 1.0</td>
<td style="width:74.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">10.4 ± 0.5</td>
<td style="width:93.65pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">11.7 ± 0.8</td>
<td style="width:53.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">312</td>
</tr>
<tr style="height:16.1pt">
<td style="width:88.4pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">4</td>
<td style="width:108.15pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">14.1 ± 1.0</td>
<td style="width:74.2pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">10.0 ± 0.5</td>
<td style="width:93.65pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">12.1 ± 0.8</td>
<td style="width:53.25pt;border:none;padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">416</td>
</tr>
<tr style="height:16.1pt">
<td style="width:88.4pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">5</td>
<td style="width:108.15pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">14.7 ± 1.0</td>
<td style="width:74.2pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">9.8 ± 0.4</td>
<td style="width:93.65pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">12.3 ± 0.7</td>
<td style="width:53.25pt;border:none;border-bottom:solid windowtext 1.0pt;   padding:0cm 5.4pt 0cm 5.4pt;   height:16.1pt">520</td>
</tr>
</tbody>
</table>
</alternatives>
<attrib>Source: Created by the authors.</attrib>
</table-wrap>
</p>
</sec>
<sec>
<title>
<bold>3.3 Experiment 3: comparison with another methodology in non-intrusive mode</bold>
</title>
<p>In the literature there are several works on biometric verification based on keystroke dynamics, but few verify the identity of the user in a non-intrusive way. The methodology proposed in <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref6">6</xref>]</sup> is a work of identity verification in non-intrusive mode.</p>
<p>We implemented this methodology with the 170 users of our database. In <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref6">6</xref>]</sup>, the authors propose to create a student profile based on the average Hold time when pressing different keys. The similarity between registered and log-in samples is calculated by the Euclidean distance and a training set was taken to optimize the decision threshold.</p>
<p>This methodology was adapted to the problem of non-intrusive verification, using tasks 1 to 4 as register tasks and the task 5 for log-in.</p>
<p><xref ref-type="fig" rid="gf8">Fig. 9</xref> shows the EER when varying the decision threshold from 0 to 7000 with steps of 10. <xref ref-type="fig" rid="gf8">Fig. 9</xref> shows an EER of 36 % when the threshold is 390. This is the minimum EER obtained using the methodology proposed in <sup>[<xref ref-type="bibr" rid="redalyc_344262603026_ref6">6</xref>]</sup> for a non-intrusive verification approach. As can be observed, the approach proposed here, based on GMM models, is more accurate and reliable than other approaches reported in the literature.</p>
<p>
<fig id="gf8">
<label>Fig. 9.</label>
<caption>
<title>EER when varying the decision threshold.</title>
</caption>
<alt-text>Fig. 9. EER when varying the decision threshold.</alt-text>
<graphic xlink:href="344262603026_gf11.png" position="anchor" orientation="portrait"/>
<attrib>Source: Created by the authors.</attrib>
</fig>
</p>
</sec>
</sec>
<sec>
<title>
<bold>4.  CONCLUSIONS</bold>
</title>
<p>This study proposed a method for identity verification based on the statistical modeling of KD using GMMs. The main application of the proposed approach can be in virtual education platforms to verify the identity of a student when he/she is performing a test. The system was evaluated in two modes: (1) intrusive mode, which is text dependent, and (2) non-intrusive mode, which is text independent (i.e., the user is not aware that his/her identity is being verified).</p>
<p>In the intrusive mode, the user logs in to the system with one of the tasks used in the registration stage. Since the log-in is performed with a fixed task, the user knows that the identity is being verified.</p>
<p>This mode showed an EER of 15.7 %. The usability of this mode was evaluated and showed a CUA of 133 keystrokes. This mode can be modified by changing the log-in tasks. For instance, the registration and log-in stages can be performed by typing the username and password. In this case the access to the system is the same as in the traditional manner. However, our proposed system provides an additional security layer because the user has to provide the username and the password with a valid KD to enter the system. The main drawback of the proposed approach is that the verification is only performed when the user logs in to the platform. If the valid user logs in to the platform but the exam is performed by an intruder, the system will not be able to detect the fraud.</p>
<p>In the non-intrusive mode, the log-in task is independent of the tasks used in the registration stage. In this case the user is not aware that he/she is being verified. This mode achieved an EER of 11.7 %. This mode can be used during evaluation activities because the identity of the user can be constantly verified without interrupting the activity. Although this mode presents a higher CUA compared to the other mode, this is not a problem because the verification can be performed based on any text typed by the user including those texts written during the examination.</p>
</sec>
</body>
<back>
<ack>
<p>The authors acknowledge the GITA research group of the Faculty of Engineering of the University of Antioquia. They also acknowledge Ingeni@ of the Faculty of Engineering of the University of Antioquia and the company Pratech S.A.S.</p>
</ack>
<ref-list>
<title>6. REFERENCES</title>
<ref id="redalyc_344262603026_ref1">
<label>[1]</label>
<mixed-citation>[1]  B. Means, Y. Toyama, R. Murphy, M. Bakia, and K. Jones, “Evaluation of Evidence-Based Practices in Online Learning: A Meta-Analysis and Review of Online Learning Studies,” U.S. Department of Education, United States, Report ED-04-CO-0040 Task 0006, 2009. Available: <ext-link ext-link-type="uri" xlink:href="https://repository.alt.ac.uk/629/1/US_DepEdu_Final_report_2009.pdf">https://repository.alt.ac.uk/629/1/US_DepEdu_Final_report_2009.pdf</ext-link>
</mixed-citation>
<element-citation publication-type="report">
<person-group person-group-type="author">
<name>
<surname>Means</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Toyama</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Murphy</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bakia</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>K.</given-names>
</name>
</person-group>
<source>Evaluation of Evidence-Based Practices in Online Learning: A Meta-Analysis and Review of Online Learning Studies</source>
<year>2009</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref2">
<label>[2]</label>
<mixed-citation>[2]  T. Bretag, <italic>Handbook of Academic Integrity</italic>. Singapore: Springer Singapore, 2016. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-981-287-098-8">https://doi.org/10.1007/978-981-287-098-8</ext-link>
</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Bretag</surname>
<given-names>T.</given-names>
</name>
</person-group>
<source>Handbook of Academic Integrity</source>
<year>2016</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref3">
<label>[3]</label>
<mixed-citation>[3]  A. K. Jain, A. Ross, and S. Prabhakar, “An Introduction to Biometric Recognition,” <italic>IEEE Trans. Circuits Syst. Video Technol.</italic>, vol. 14, no. 1, pp. 4–20, Jan. 2004. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/TCSVT.2003.818349">https://doi.org/10.1109/TCSVT.2003.818349</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jain</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Ross</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Prabhakar</surname>
<given-names>S.</given-names>
</name>
</person-group>
<source>IEEE Trans. Circuits Syst. Video Technol.</source>
<year>2004</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref4">
<label>[4]</label>
<mixed-citation>[4]  W. L. Bryan and N. Harter, “Studies in the physiology and psychology of the telegraphic language.,” <italic>Psychol. Rev.,</italic> vol. 4, no. 1, pp. 27–53, 1897. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1037/h0073806">https://doi.org/10.1037/h0073806</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bryan</surname>
<given-names>W. L.</given-names>
</name>
<name>
<surname>Harter</surname>
<given-names>N.</given-names>
</name>
</person-group>
<source>Psychol. Rev.</source>
<year>1897</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref5">
<label>[5]</label>
<mixed-citation>[5] R. Joyce and G. Gupta, “Identity authentication based on keystroke latencies,” <italic>Commun. ACM,</italic> vol. 33, no. 2, pp. 168–176, Feb. 1990. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1145/75577.75582">https://doi.org/10.1145/75577.75582</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Joyce</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Gupta</surname>
<given-names>G.</given-names>
</name>
</person-group>
<source>Commun. ACM</source>
<year>1990</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref6">
<label>[6]</label>
<mixed-citation>[6]  K. Longi, J. Leinonen, H. Nygren, J. Salmi, A. Klami, and A. Vihavainen, “Identification of programmers from typing patterns,” in <italic>Proceedings of the 15th Koli Calling Conference on Computing Education Research - Koli Calling ’15,</italic> Koli, Finland, 2015. pp. 60–67. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1145/2828959.2828960">https://doi.org/10.1145/2828959.2828960</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Longi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Leinonen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Nygren</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Salmi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Klami</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vihavainen</surname>
<given-names>A.</given-names>
</name>
</person-group>
<source>Identification of programmers from typing patterns</source>
<year>2015</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref7">
<label>[7]</label>
<mixed-citation>[7] S. Krishnamoorthy, L. Rueda, S. Saad, and H. Elmiligi, “Identification of User Behavioral Biometrics for Authentication Using Keystroke Dynamics and Machine Learning,” in <italic>Proceedings of the 2018 2nd International Conference on Biometric Engineering and Applications - ICBEA ’18</italic>, Amsterdam, 2018. pp. 50–57. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1145/3230820.3230829">https://doi.org/10.1145/3230820.3230829</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Krishnamoorthy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rueda</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Saad</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Elmiligi</surname>
<given-names>H.</given-names>
</name>
</person-group>
<source>Identification of User Behavioral Biometrics for Authentication Using Keystroke Dynamics and Machine Learning</source>
<year>2018</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref8">
<label>[8]</label>
<mixed-citation>[8] J. R. Young, R. S. Davies, J. L. Jenkins, and I. Pfleger, “Keystroke Dynamics: Establishing Keyprints to Verify Users in Online Courses,” <italic>Comput. Sch.</italic>, vol. 36, no. 1, pp. 48–68, Jan. 2019. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1080/07380569.2019.1565905">https://doi.org/10.1080/07380569.2019.1565905</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Young</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Davies</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Jenkins</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Pfleger</surname>
<given-names>I.</given-names>
</name>
</person-group>
<source>Comput. Sch.</source>
<year>2019</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref9">
<label>[9]</label>
<mixed-citation>[9] A. Morales, M. Falanga, J. Fierrez, C. Sansone, and J. Ortega-Garcia, “Keystroke dynamics recognition based on personal data: A comparative experimental evaluation implementing reproducible research,” in <italic>2015 IEEE 7th International Conference on Biometrics Theory, Applications and Systems (BTAS)</italic>, Arlington, 2015. pp. 1–6. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/BTAS.2015.7358772">https://doi.org/10.1109/BTAS.2015.7358772</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Morales</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Falanga</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fierrez</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sansone</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Ortega-Garcia</surname>
<given-names>J.</given-names>
</name>
</person-group>
<source>Keystroke dynamics recognition based on personal data: A comparative experimental evaluation implementing reproducible research</source>
<year>2015</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref10">
<label>[10]</label>
<mixed-citation>[10] M. W. Shelley, <italic>Frankenstein or, the modern Prometheus</italic>. London: Penguin, 2007.</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Shelley</surname>
<given-names>M. W.</given-names>
</name>
</person-group>
<source>Frankenstein or, the modern Prometheus</source>
<year>2007</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref11">
<label>[11]</label>
<mixed-citation>[11] D. Yu and L. Deng, <italic>Automatic Speech Recognition</italic>. London: Springer London, 2015. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-1-4471-5779-3">https://doi.org/10.1007/978-1-4471-5779-3</ext-link>
</mixed-citation>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>L.</given-names>
</name>
</person-group>
<source>Automatic Speech Recognition</source>
<year>2015</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref12">
<label>[12]</label>
<mixed-citation>[12] D. A. Reynolds, T. F. Quatieri, and R. B. Dunn, “Speaker Verification Using Adapted Gaussian Mixture Models,” <italic>Digit. Signal Process.</italic>, vol. 10, no. 1–3, pp. 19–41, Jan. 2000. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1006/dspr.1999.0361">https://doi.org/10.1006/dspr.1999.0361</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reynolds</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Quatieri</surname>
<given-names>T. F.</given-names>
</name>
<name>
<surname>Dunn</surname>
<given-names>R. B.</given-names>
</name>
</person-group>
<source>Digit. Signal Process.</source>
<year>2000</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref13">
<label>[13]</label>
<mixed-citation>[13] D. A. Reynolds and R. C. Rose, “Robust text-independent speaker identification using Gaussian mixture speaker models,” <italic>IEEE Trans. Speech Audio Process.,</italic> vol. 3, no. 1, pp. 72–83, 1995. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/89.365379">https://doi.org/10.1109/89.365379</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reynolds</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Rose</surname>
<given-names>R. C.</given-names>
</name>
</person-group>
<source>IEEE Trans. Speech Audio Process.</source>
<year>1995</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref14">
<label>[14]</label>
<mixed-citation>[14] M. Nishida and T. Kawahara, “Speaker model selection based on the Bayesian information criterion applied to unsupervised speaker indexing,” <italic>IEEE Trans. Speech Audio Process.</italic>, vol. 13, no. 4, pp. 583–592, Jul. 2005. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/TSA.2005.848890">https://doi.org/10.1109/TSA.2005.848890</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nishida</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kawahara</surname>
<given-names>T.</given-names>
</name>
</person-group>
<source>IEEE Trans. Speech Audio Process.</source>
<year>2005</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref15">
<label>[15]</label>
<mixed-citation>[15] P. Mahalanobis, "On the generalized distance in statistics", <italic>National Institute of Science of India</italic>, vol. 2, no. 1, pp. 49-55, Apr. 1936. Available: <ext-link ext-link-type="uri" xlink:href="http://library.isical.ac.in:8080/xmlui/bitstream/handle/123456789/6765/Vol02_1936_1_Art05-pcm.pdf?sequence=1&amp;isAllowed=y">http://library.isical.ac.in:8080/xmlui/bitstream/handle/123456789/6765/Vol02_1936_1_Art05-pcm.pdf?sequence=1&amp;isAllowed=y</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahalanobis</surname>
<given-names>P.</given-names>
</name>
</person-group>
<source>National Institute of Science of India</source>
<year>1936</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref16">
<label>[16]</label>
<mixed-citation>[16] T. Arias-Vergara, J. C. Vásquez-Correa, J. R. Orozco-Arroyave, J. F. Vargas-Bonilla and E. Nöth, “Parkinson's Disease Progression Assessment from Speech Using GMM-UBM”, <italic>Proceedings of Interspeech</italic>, pp. 1933-1937, San Francisco, 2016. Available: <ext-link ext-link-type="uri" xlink:href="https://www.isca-speech.org/archive/Interspeech_2016/pdfs/1122.PDF">https://www.isca-speech.org/archive/Interspeech_2016/pdfs/1122.PDF</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Arias-Vergara</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Vásquez-Correa</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Orozco-Arroyave</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Vargas-Bonilla</surname>
<given-names>J. F.</given-names>
</name>
<name>
<surname>Nöth</surname>
<given-names>E.</given-names>
</name>
</person-group>
<source>Parkinson's Disease Progression Assessment from Speech Using GMM-UBM</source>
<year>2016</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref17">
<label>[17]</label>
<mixed-citation>[17]  A. Peacock, X. Ke, and M. Wilkerson, “Typing patterns: a key to user identification,” <italic>IEEE Secur. Priv. Mag.</italic>, vol. 2, no. 5, pp. 40–47, Sep. 2004. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/MSP.2004.89">https://doi.org/10.1109/MSP.2004.89</ext-link>
</mixed-citation>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peacock</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ke</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wilkerson</surname>
<given-names>M.</given-names>
</name>
</person-group>
<source>IEEE Secur. Priv. Mag.</source>
<year>2004</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref18">
<label>[18]</label>
<mixed-citation>[18] N. Garcia-Ospina, J.-R. Orozco-Arroyave, and J.-F. Vargas-Bonilla, “Speaker Verification System for Online Education Platforms,” in <italic>2018 International Carnahan Conference on Security Technology (ICCST)</italic>, Montreal, 2018. pp. 1–5. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/CCST.2018.8585602">https://doi.org/10.1109/CCST.2018.8585602</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Garcia-Ospina</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Orozco-Arroyave</surname>
<given-names>J.-R.</given-names>
</name>
<name>
<surname>Vargas-Bonilla</surname>
<given-names>J.-F.</given-names>
</name>
</person-group>
<source>Speaker Verification System for Online Education Platforms</source>
<year>2018</year>
</element-citation>
</ref>
<ref id="redalyc_344262603026_ref19">
<label>[19]</label>
<mixed-citation>[19] X. Jiang, S. Wang, X. Xiang, and Y. Qian, “Integrating online i-vector into GMM-UBM for text-dependent speaker verification,” in <italic>2017 Asia-Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)</italic>, Kuala Lumpur, 2017. pp. 1628–1632. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/APSIPA.2017.8282293">https://doi.org/10.1109/APSIPA.2017.8282293</ext-link>
</mixed-citation>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>Y.</given-names>
</name>
</person-group>
<source>Integrating online i-vector into GMM-UBM for text-dependent speaker verification</source>
<year>2017</year>
</element-citation>
</ref>
</ref-list>
</back>
</article>