<?xml version="1.0" encoding="UTF-8"?>
<oai_dc:dc xmlns:oai_dc="http://www.openarchives.org/OAI/2.0/oai_dc/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.openarchives.org/OAI/2.0/oai_dc/ http://www.openarchives.org/OAI/2.0/oai_dc.xsd">
  <dc:title>Mixed N-Grams and Unigram Sequence Segmentation</dc:title>
  <dc:title>R package NUSS version 0.1.0</dc:title>
  <dc:description>Segmentation of short text sequences - like hashtags - into
    sequences of separate words, done with the use of a dictionary, which may
    be built on a custom corpus of texts. A unigram dictionary is used to find
    the most probable sequence, and an n-grams approach is used to determine
    possible segmentations given the text corpus.</dc:description>
  <dc:type>Software</dc:type>
  <dc:relation>Depends: R (&gt;= 3.5)</dc:relation>
  <dc:relation>Imports: dplyr, magrittr, Rcpp, stringr, text2vec, textclean, utils</dc:relation>
  <dc:relation>LinkingTo: BH, Rcpp</dc:relation>
  <dc:relation>Suggests: testthat (&gt;= 3.0.0)</dc:relation>
  <dc:creator>Oskar Kosch &lt;contact@oskarkosch.com&gt;</dc:creator>
  <dc:publisher>Comprehensive R Archive Network (CRAN)</dc:publisher>
  <dc:contributor>Oskar Kosch [aut, cre] (ORCID: &lt;https://orcid.org/0000-0003-2697-1393&gt;)</dc:contributor>
  <dc:rights>GPL (&gt;= 3)</dc:rights>
  <dc:date>2024-08-19</dc:date>
  <dc:format>application/tgz</dc:format>
  <dc:identifier>https://CRAN.R-project.org/package=NUSS</dc:identifier>
  <dc:identifier>doi:10.32614/CRAN.package.NUSS</dc:identifier>
  <dc:language>en</dc:language>
</oai_dc:dc>
