axle.lx
TFIDFDocumentVectorSpace
class TFIDFDocumentVectorSpace extends DocumentVectorSpace
Instance Constructors
-
new TFIDFDocumentVectorSpace(_stopwords: Set[String], corpus: List[String])
Type Members
-
type TV = Map[String, Int]
Value Members
-
def
!=
(arg0: AnyRef): Boolean
-
def
!=
(arg0: Any): Boolean
-
def
##
(): Int
-
def
==
(arg0: AnyRef): Boolean
-
def
==
(arg0: Any): Boolean
-
lazy val
_vectors
: IndexedSeq[TV]
-
def
asInstanceOf
[T0]
: T0
-
def
clone
(): AnyRef
-
lazy val
df
: Map[String, Int]
-
def
doc2vector
(doc: String): TV
-
def
dotProduct
(v1: TV, v2: TV): Double
-
def
eq
(arg0: AnyRef): Boolean
-
def
equals
(arg0: Any): Boolean
-
def
finalize
(): Unit
-
def
getClass
(): java.lang.Class[_]
-
def
hashCode
(): Int
-
def
isInstanceOf
[T0]
: Boolean
-
def
length
(v: TV): Double
-
def
mrWordCount
(is: Iterator[String]): Map[String, Int]
-
def
mrWordExistsCount
(is: Iterator[String]): Map[String, Int]
-
def
nMostSimilar
(query: String, n: Int): List[(Int, Double)]
-
def
ne
(arg0: AnyRef): Boolean
-
def
notify
(): Unit
-
def
notifyAll
(): Unit
-
lazy val
numDocs
: Int
-
def
similarity
(v1: TV, v2: TV): Double
-
def
similarityMatrix
(): Matrix[Double]
-
def
square
(x: Double): Double
-
def
stopwords
(): Set[String]
-
def
synchronized
[T0]
(arg0: ⇒ T0): T0
-
def
termWeight
(term: String, doc: TV): Double
-
def
toString
(): String
-
def
vectors
(): IndexedSeq[TV]
-
def
wait
(): Unit
-
def
wait
(arg0: Long, arg1: Int): Unit
-
def
wait
(arg0: Long): Unit
-
val
whitespace
: Regex
Inherited from AnyRef
Inherited from Any