<?xml version="1.0" encoding="UTF-8"?><?xml-stylesheet type="text/xsl" href="static/style.xsl"?><OAI-PMH xmlns="http://www.openarchives.org/OAI/2.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/ http://www.openarchives.org/OAI/2.0/OAI-PMH.xsd"><responseDate>2026-05-06T18:52:07Z</responseDate><request verb="GetRecord" identifier="oai:riubu.ubu.es:10259/4221" metadataPrefix="xoai">https://riubu.ubu.es/oai/request</request><GetRecord><record><header><identifier>oai:riubu.ubu.es:10259/4221</identifier><datestamp>2021-11-10T09:38:16Z</datestamp><setSpec>com_10259_5377</setSpec><setSpec>com_10259_5086</setSpec><setSpec>com_10259_2604</setSpec><setSpec>com_10259_4219</setSpec><setSpec>col_10259_5378</setSpec><setSpec>col_10259_4220</setSpec></header><metadata><metadata xmlns="http://www.lyncode.com/xoai" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.lyncode.com/xoai http://www.lyncode.com/xsd/xoai.xsd">
<element name="dc">
<element name="contributor">
<element name="author">
<element name="none">
<field name="value">Arnaiz González, Álvar</field>
<field name="authority">39</field>
<field name="confidence">500</field>
<field name="orcid_id">0000-0001-6965-0237</field>
<field name="value">Diez Pastor, José Francisco</field>
<field name="authority">156</field>
<field name="confidence">500</field>
<field name="orcid_id"/>
<field name="value">Rodríguez Diez, Juan José</field>
<field name="authority">477</field>
<field name="confidence">500</field>
<field name="orcid_id"/>
<field name="value">García Osorio, César</field>
<field name="authority">212</field>
<field name="confidence">500</field>
<field name="orcid_id">0000-0002-1206-1084</field>
</element>
</element>
</element>
<element name="date">
<element name="accessioned">
<element name="none">
<field name="value">2016-09-01T09:42:59Z</field>
</element>
</element>
<element name="available">
<element name="none">
<field name="value">2016-09-01T09:42:59Z</field>
</element>
</element>
<element name="issued">
<element name="none">
<field name="value">2016-09</field>
</element>
</element>
<element name="embargoEndDate">
<element name="none"/>
</element>
</element>
<element name="identifier">
<element name="issn">
<element name="none">
<field name="value">0950-7051</field>
</element>
</element>
<element name="uri">
<element name="none">
<field name="value">http://hdl.handle.net/10259/4221</field>
</element>
</element>
<element name="doi">
<element name="none">
<field name="value">10.1016/j.knosys.2016.05.056</field>
</element>
</element>
</element>
<element name="description">
<element name="abstract">
<element name="en">
<field name="value">Over recent decades, database sizes have grown considerably. Larger sizes present new challenges, because machine learning algorithms are not prepared to process such large volumes of information. Instance selection methods can alleviate this problem when the size of the data set is medium to large. However, even these methods face similar problems with very large-to-massive data sets.&#xd;
&#xd;
In this paper, two new algorithms with linear complexity for instance selection purposes are presented. Both algorithms use locality-sensitive hashing to find similarities between instances. While the complexity of conventional methods (usually quadratic, O(n²), or log-linear, O(n log n)) means that they are unable to process large-sized data sets, the new proposal shows competitive results in terms of accuracy. Even more remarkably, it shortens execution time, as the proposal manages to reduce complexity and make it linear with respect to the data set size. The new proposal has been compared with some of the best known instance selection methods for testing and has also been evaluated on large data sets (up to a million instances).</field>
</element>
</element>
<element name="sponsorship">
<element name="en">
<field name="value">Supported by the Research Projects TIN 2011-24046 and TIN 2015-67534-P from the Spanish Ministry of Economy and Competitiveness.</field>
</element>
</element>
</element>
<element name="format">
<element name="mimetype">
<element name="none">
<field name="value">application/pdf</field>
</element>
</element>
</element>
<element name="language">
<element name="iso">
<element name="es">
<field name="value">eng</field>
</element>
</element>
</element>
<element name="publisher">
<element name="en">
<field name="value">Elsevier</field>
</element>
</element>
<element name="relation">
<element name="ispartof">
<element name="en">
<field name="value">Knowledge-Based Systems. 2016. V. 107, p. 83–95</field>
</element>
</element>
<element name="publisherversion">
<element name="none">
<field name="value">http://dx.doi.org/10.1016/j.knosys.2016.05.056</field>
</element>
</element>
<element name="projectID">
<element name="none">
<field name="value">info:eu-repo/grantAgreement/MINECO/TIN 2011-24046</field>
<field name="value">info:eu-repo/grantAgreement/MINECO/TIN 2015-67534-P</field>
</element>
</element>
</element>
<element name="rights">
<element name="none">
<field name="value">Attribution 4.0 International</field>
</element>
<element name="uri">
<element name="none">
<field name="value">http://creativecommons.org/licenses/by/4.0/</field>
</element>
</element>
<element name="accessRights">
<element name="none">
<field name="value">info:eu-repo/semantics/openAccess</field>
</element>
</element>
</element>
<element name="subject">
<element name="en">
<field name="value">Nearest neighbor</field>
<field name="value">Data reduction</field>
<field name="value">Instance selection</field>
<field name="value">Hashing</field>
<field name="value">Big data</field>
</element>
<element name="other">
<element name="es">
<field name="value">Informática</field>
</element>
<element name="en">
<field name="value">Computer science</field>
</element>
</element>
</element>
<element name="title">
<element name="en">
<field name="value">Instance selection of linear complexity for big data</field>
</element>
</element>
<element name="type">
<element name="none">
<field name="value">info:eu-repo/semantics/article</field>
</element>
<element name="hasVersion">
<element name="en">
<field name="value">info:eu-repo/semantics/publishedVersion</field>
</element>
</element>
</element>
</element>
<element name="bundles">
<element name="bundle">
<field name="name">CC-LICENSE</field>
<element name="bitstreams">
<element name="bitstream">
<field name="name">license_rdf</field>
<field name="originalName">license_rdf</field>
<field name="format">application/rdf+xml; charset=utf-8</field>
<field name="size">908</field>
<field name="url">https://riubu.ubu.es/bitstream/10259/4221/8/license_rdf</field>
<field name="checksum">0175ea4a2d4caec4bbcc37e300941108</field>
<field name="checksumAlgorithm">MD5</field>
<field name="sid">8</field>
</element>
</element>
</element>
<element name="bundle">
<field name="name">THUMBNAIL</field>
<element name="bitstreams">
<element name="bitstream">
<field name="name">Arnaiz-KBS_2016.pdf.jpg</field>
<field name="originalName">Arnaiz-KBS_2016.pdf.jpg</field>
<field name="description">IM Thumbnail</field>
<field name="format">image/jpeg</field>
<field name="size">3919</field>
<field name="url">https://riubu.ubu.es/bitstream/10259/4221/7/Arnaiz-KBS_2016.pdf.jpg</field>
<field name="checksum">e618d1f61323a2ed3cc538ca8ff0c262</field>
<field name="checksumAlgorithm">MD5</field>
<field name="sid">7</field>
</element>
</element>
</element>
<element name="bundle">
<field name="name">ORIGINAL</field>
<element name="bitstreams">
<element name="bitstream">
<field name="name">Arnaiz-KBS_2016.pdf</field>
<field name="originalName">Arnaiz-KBS_2016.pdf</field>
<field name="format">application/pdf</field>
<field name="size">1184745</field>
<field name="url">https://riubu.ubu.es/bitstream/10259/4221/1/Arnaiz-KBS_2016.pdf</field>
<field name="checksum">d4e42af8a5936dad7b8f6e543e96d24f</field>
<field name="checksumAlgorithm">MD5</field>
<field name="sid">1</field>
</element>
</element>
</element>
<element name="bundle">
<field name="name">LICENSE</field>
<element name="bitstreams">
<element name="bitstream">
<field name="name">license.txt</field>
<field name="originalName">license.txt</field>
<field name="format">text/plain; charset=utf-8</field>
<field name="size">1362</field>
<field name="url">https://riubu.ubu.es/bitstream/10259/4221/5/license.txt</field>
<field name="checksum">5d013bfa6e473ff0db22cd82a4d71a70</field>
<field name="checksumAlgorithm">MD5</field>
<field name="sid">5</field>
</element>
</element>
</element>
<element name="bundle">
<field name="name">TEXT</field>
<element name="bitstreams">
<element name="bitstream">
<field name="name">Arnaiz-KBS_2016.pdf.txt</field>
<field name="originalName">Arnaiz-KBS_2016.pdf.txt</field>
<field name="description">Extracted text</field>
<field name="format">text/plain</field>
<field name="size">67394</field>
<field name="url">https://riubu.ubu.es/bitstream/10259/4221/6/Arnaiz-KBS_2016.pdf.txt</field>
<field name="checksum">6389f85d4eac645f34bbf67d56f6eb1a</field>
<field name="checksumAlgorithm">MD5</field>
<field name="sid">6</field>
</element>
</element>
</element>
</element>
<element name="others">
<field name="handle">10259/4221</field>
<field name="identifier">oai:riubu.ubu.es:10259/4221</field>
<field name="lastModifyDate">2021-11-10 10:38:16.955</field>
</element>
<element name="repository">
<field name="name">Repositorio Institucional de la Universidad de Burgos</field>
<field name="mail">bubrep@ubu.es</field>
</element>
<element name="license">
<field name="bin">RWwgYXV0b3IgY29tbyDDum5pY28gdGl0dWxhciBkZSBsb3MgZGVyZWNob3MgZGUgcHJvcGllZGFkIGludGVsZWN0dWFsIGRlIGxhIG9icmEsIG8gZGlzcG9uaWVuZG8gZGUgbG9zIGRlYmlkb3MgcGVybWlzb3MgZGUgbG9zIG90cm9zIHRpdHVsYXJlcywgc2kgbG9zIGh1YmllcmEsIHkgZW4gdmlydHVkIGRlIGxvcyBkZXJlY2hvcyBxdWUgbGUgY29uZmllcmUgbGEgbGVnaXNsYWNpw7NuIHZpZ2VudGUgc29icmUgcHJvcGllZGFkIGludGVsZWN0dWFsIHkgZGVyZWNob3MgZGUgYXV0b3IsIApBVVRPUklaQSBhIGxhIFVuaXZlcnNpZGFkIGRlIEJ1cmdvcyBhIGRpZnVuZGlyLCBkZSBtYW5lcmEgZ3JhdHVpdGEsIGVsIGNvbnRlbmlkbyBkZSBsb3MgYXJjaGl2b3MgZGlnaXRhbGVzIHF1ZSBjb3JyZXNwb25kZW4gYWwgZG9jdW1lbnRvIGRlc2NyaXRvIGFudGVyaW9ybWVudGUsIGNvbiBjYXLDoWN0ZXIgbm8gZXhjbHVzaXZvIHkgZGUgbWFuZXJhIHDDumJsaWNhIGVuIGFjY2VzbyBhYmllcnRvIGEgdHJhdsOpcyBkZSBJbnRlcm5ldCwgcGFyYSBsbyBxdWUgbGEgQmlibGlvdGVjYSBwcm9jZWRlcsOhIGEgYXJjaGl2YXJsb3MgZW4gZWwgUmVwb3NpdG9yaW8gSW5zdGl0dWNpb25hbC4gQXNpbWlzbW8gYXV0b3JpemEgYSBsYSBVbml2ZXJzaWRhZCBkZSBCdXJnb3MgYSByZWFsaXphciBsYXMgdHJhbnNmb3JtYWNpb25lcyBuZWNlc2FyaWFzIGRlIGZvcm1hdG8sIG5vIGRlIGNvbnRlbmlkbywgcGFyYSBnYXJhbnRpemFyIGxhIHByZXNlcnZhY2nDs24geSBlbCBhY2Nlc28gZW4gZWwgZnV0dXJvLgoKRWwgYXV0b3IgZGlzcG9uZSwgZW4gdG9kbyBjYXNvLCBkZWwgZGVyZWNobyBhIHJldm9jYXIgZXN0YSBhdXRvcml6YWNpw7NuLgoKTGEgY2VzacOzbiBkZSBkZXJlY2hvcyBkZSBlc3RhIG9icmEgc2UgZW5jdWVudHJhIHN1amV0YSBhIGxhIGxlZ2lzbGFjacOzbiB2aWdlbnRlIHNvYnJlIHByb3BpZWRhZCBpbnRlbGVjdHVhbCB5IGRlcmVjaG9zIGRlIGF1dG9yLiBTdSBkaWZ1c2nDs24gZW4gZWwgUmVwb3NpdG9yaW8gc2Vyw6EgYmFqbyBsYSBtb2RhbGlkYWQgZGUgbGljZW5jaWEgQ3JlYXRpdmUgQ29tbW9ucyBvIGVxdWl2YWxlbnRlOiByZWNvbm9jaW1pZW50byDigJMgdXNvIG5vIGNvbWVyY2lhbCDigJMgc2luIG9icmEgZGVyaXZhZGEsIHBvciBsYSBxdWUgc2UgcGVybWl0ZSBoYWNlciBjb3BpYSwgZGlzdHJpYnVpciB5IGNvbXVuaWNhciBww7pibGljYW1lbnRlIGxhIG9icmEgc2llbXByZSBxdWUgc2UgY2l0ZSBhbCBhdXRvciwgZWwgdXNvIHF1ZSBzZSBoYWdhIGRlIGVsbGEgc2VhIG5vIGNvbWVyY2lhbCB5IG5vIHNlIGNyZWVuIG9icmFzIGRlcml2YWRhcyBhIHBhcnRpciBkZSBsYSBvcmlnaW5hbC4K</field>
</element>
</metadata></metadata></record></GetRecord></OAI-PMH>