lib/tomoto/lda.rb in tomoto-0.1.0 vs lib/tomoto/lda.rb in tomoto-0.1.1
- old
+ new
@@ -13,13 +13,11 @@
model._load(filename)
model
end
# Adds one document to the model via _add_doc.
# Old (-) body: raised if @prepared was already defined, split any non-Array
# doc on runs of whitespace, then called _add_doc with the result.
# New (+) body: delegates that check and normalization to prepare_doc and
# passes its return value to _add_doc.
def add_doc(doc)
- raise "cannot add_doc() after train()" if defined?(@prepared)
- doc = doc.split(/[[:space:]]+/) unless doc.is_a?(Array)
- _add_doc(doc)
+ _add_doc(prepare_doc(doc))
end
def count_by_topics
prepare
_count_by_topics
@@ -45,16 +43,26 @@
# Trains the model: calls prepare first, then _train(iterations, workers).
# iterations defaults to 10 and workers to 0.
# NOTE(review): how _train interprets workers == 0 is not visible in this
# excerpt — confirm against the native implementation.
def train(iterations = 10, workers: 0)
prepare
_train(iterations, workers)
end
# Returns the TERM_WEIGHT entry indexed by the value that _tw returns.
# NOTE(review): TERM_WEIGHT and _tw are defined outside this excerpt;
# presumably _tw yields a key/index for a term-weighting scheme — confirm.
+ def tw
+ TERM_WEIGHT[_tw]
+ end
+
private
# Calls _prepare(@min_cf, @min_df, @rm_top) the first time it is invoked and
# skips it on later calls, using @prepared as the "already done" marker.
def prepare
unless defined?(@prepared)
_prepare(@min_cf, @min_df, @rm_top)
# defined? tests for the ivar's existence, so assigning any value here
# is what makes the later guards (here and in the add_doc path) trip.
@prepared = true
end
+ end
+
# Checks and normalizes a document before it is handed to _add_doc.
# Raises (RuntimeError, via a bare string raise) if @prepared is defined.
# A doc that is not an Array is split on runs of whitespace; an Array is
# returned unchanged.
+ def prepare_doc(doc)
+ raise "cannot add_doc() after train()" if defined?(@prepared)
+ doc = doc.split(/[[:space:]]+/) unless doc.is_a?(Array)
+ doc
end
class << self
private