changelog shortlog graph tags branches changeset file revisions annotate raw help

Mercurial > core / lisp/lib/nlp/tokenize.lisp

revision 96: 301fd45bbe73
parent 54: 83f6c62bf2a8
child 495: 7120877e0453
     1.1--- a/lisp/lib/nlp/tokenize.lisp	Mon Dec 11 22:54:13 2023 -0500
     1.2+++ b/lisp/lib/nlp/tokenize.lisp	Wed Dec 13 20:02:36 2023 -0500
     1.3@@ -1,5 +1,5 @@
     1.4 (defpackage :nlp/tokenize
     1.5-  (:use :cl :std :std/str :cl-ppcre :nlp/data :nlp/stem/porter)
     1.6+  (:use :cl :std :cl-ppcre :nlp/data :nlp/stem/porter)
     1.7   (:export :word-tokenize :sentence-tokenize))
     1.8 
     1.9 (in-package :nlp/tokenize)
    1.10@@ -25,4 +25,4 @@
    1.11   "Split a string into a list of sentences."
    1.12   ;; TODO: Use "\\p{Terminal_Punctuation}" regexp instead to catch all terminal
    1.13   ;; punctuation marks, including "," and ";"?
    1.14-  (remove "" (mapcar #'std/str:trim (cl-ppcre:split "[.!?]" string)) :test #'equal))
    1.15+  (remove "" (mapcar #'std:trim (cl-ppcre:split "[.!?]" string)) :test #'equal))