<?xml version="1.0" encoding="UTF-8"?>
<oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/"
           xmlns:dc="http://purl.org/dc/elements/1.1/"
           xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
           xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
  <!-- Dublin Core record for the R package AhoCorasickTrie, version 0.1.3.
       Text content below is kept verbatim: whitespace inside these elements
       is part of the value, so do not re-wrap or re-indent it. -->

  <!-- Titles: the descriptive title, then the package name with its version. -->
  <dc:title>Fast Searching for Multiple Keywords in Multiple Texts</dc:title>
  <dc:title>R package AhoCorasickTrie version 0.1.3</dc:title>

  <!-- Free-text package description. -->
  <dc:description>Aho-Corasick is an optimal algorithm for finding many
    keywords in a text. It can locate all matches in a text in O(N+M) time; i.e.,
    the time needed scales linearly with the number of keywords (N) and the size of
    the text (M). Compare this to the naive approach which takes O(N*M) time to loop
    through each pattern and scan for it in the text. This implementation builds the
    trie (the generic name of the data structure) and runs the search in a single
    function call. If you want to search multiple texts with the same trie, the
    function will take a list or vector of texts and return a list of matches to
    each text. By default, all 128 ASCII characters are allowed in both the keywords
    and the text. A more efficient trie is possible if the alphabet size can be
    reduced. For example, DNA sequences use at most 19 distinct characters and
    usually only 4; protein sequences use at most 26 distinct characters and usually
    only 20. UTF-8 (Unicode) matching is not currently supported.</dc:description>
  <dc:type>Software</dc:type>

  <!-- Dependency fields, one dc:relation per field (Imports, LinkingTo, Suggests). -->
  <dc:relation>Imports: Rcpp (&gt;= 0.12.5)</dc:relation>
  <dc:relation>LinkingTo: Rcpp</dc:relation>
  <dc:relation>Suggests: microbenchmark, testthat</dc:relation>

  <!-- Agents: creator (with e-mail), publisher, and the contributor list with
       its bracketed role codes, all stored in a single dc:contributor value. -->
  <dc:creator>Matt Chambers &lt;matt.chambers42@gmail.com&gt;</dc:creator>
  <dc:publisher>Comprehensive R Archive Network (CRAN)</dc:publisher>
  <dc:contributor>Matt Chambers [aut, cre],
  Tomas Petricek [aut, cph],
  Vanderbilt University [cph]</dc:contributor>

  <!-- Licence, date (ISO 8601 calendar date) and distribution format. -->
  <dc:rights>Apache License 2.0</dc:rights>
  <dc:date>2025-02-05</dc:date>
  <dc:format>application/tgz</dc:format>

  <!-- Identifiers: the CRAN package URL and the package DOI. -->
  <dc:identifier>https://CRAN.R-project.org/package=AhoCorasickTrie</dc:identifier>
  <dc:identifier>doi:10.32614/CRAN.package.AhoCorasickTrie</dc:identifier>
</oai_dc:dc>
