Permalink
Browse files

The lexicon file is ISO-8859-1, not ASCII. Now works with SBCL.

  • Loading branch information...
1 parent 1d43de0 commit 192bb3010f6ddb02174e3660e06699097bf96989 @ActiveWebSolutions ActiveWebSolutions committed Oct 18, 2012
Showing with 2 additions and 2 deletions.
  1. +2 −2 src/lexicon.lisp
View
@@ -34,14 +34,14 @@
(with-static-memory-allocation ()
(write-log lexicon-init "Reading lexicon from ~A" lexicon-file)
;; Parse the lines into a predicate ID and two node structures
- (with-open-file ( s lexicon-file :external-format :ascii)
+ (with-open-file ( s lexicon-file :external-format :iso-8859-1)
(do-count-contentful-lines (l count s)
(when (= (mod count 10000) 0) (write-log lexicon-init "Processed ~A lines" count))
(let ((lexicon-entry (extract-words l))) ;; (pregex:split "\\s+" l)))
(add-basic-entry (car lexicon-entry) (mapcar #'mkkeysym (cdr lexicon-entry))))))
(write-log lexicon-init "Reading word->lemma data from ~A" lemma-file)
;; Parse the lines into a predicate ID and possible roots
- (with-open-file ( s lemma-file :external-format :ascii)
+ (with-open-file ( s lemma-file :external-format :iso-8859-1)
(do-count-contentful-lines (l count s)
(when (= (mod count 10000) 0) (write-log lexicon-init "Processed ~A lines" count))
(let ((roots-entry (extract-words l)))

0 comments on commit 192bb30

Please sign in to comment.