From b5f92c5ced4ab9d6ac3fdb494d62e4ba7e529d1e Mon Sep 17 00:00:00 2001 From: Joshua Eckroth Date: Wed, 17 Jul 2013 00:41:02 -0400 Subject: [PATCH] Support :normalize option in docs-to-dataset --- src/clj_ml/data.clj | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/clj_ml/data.clj b/src/clj_ml/data.clj index 21d7f54..5e8aa04 100644 --- a/src/clj_ml/data.clj +++ b/src/clj_ml/data.clj @@ -534,6 +534,7 @@ split immediately you can use do-split-dataset." :lowercase (:lowercase parsed-opts true) :prefix "title-" :words-to-keep (:words-to-keep parsed-opts 1000) :counts (:counts parsed-opts false) + :normalize (:normalize parsed-opts false) :transform-tf (:transform-tf parsed-opts true) :transform-idf (:transform-idf parsed-opts true) :stemmer (if (:stemmer parsed-opts false) @@ -549,6 +550,7 @@ split immediately you can use do-split-dataset." :lowercase (:lowercase parsed-opts true) :prefix "fulltext-" :words-to-keep (:words-to-keep parsed-opts 1000) :counts (:counts parsed-opts false) + :normalize (:normalize parsed-opts false) :transform-tf (:transform-tf parsed-opts true) :transform-idf (:transform-idf parsed-opts true) :stemmer (if (:stemmer parsed-opts false)