package features
TODO
- Alphabetic
- By Inheritance
- features
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Type Members
- case class ActualWordFeature (f: Feature, dir: Symbol) extends Feature with Product with Serializable
- case class AttachLeft (distance: Int) extends LexFeature with Product with Serializable
- case class AttachRight (distance: Int) extends LexFeature with Product with Serializable
- case class BigramFeature (offset: Int, prev: Feature, next: Feature) extends Feature with Product with Serializable
- case class BilexicalFeature (head: Any, dep: Any) extends Feature with Product with Serializable
- trait BilexicalFeatureAnchoring [W] extends AnyRef
-
trait
BilexicalFeaturizer
[W] extends AnyRef
TODO
-
case class
BrownClusterFeature
(f: String) extends Feature with Serializable with Product
- Annotations
- @SerialVersionUID()
-
case class
BrownClusterFeaturizer
(lengths: Array[Int]) extends WordFeaturizer[String] with Serializable with Product
- Annotations
- @SerialVersionUID()
- case class ContextFeature (f: Feature) extends Feature with Product with Serializable
-
case class
ContextFeaturizer
[W](featurizer: WordFeaturizer[W], window: Int) extends WordFeaturizer[W] with Serializable with Product
Includes all features that occur within a window, but does not record the positions at which those features occur.
- Annotations
- @SerialVersionUID()
-
class
ContextWordFeaturizer
[W] extends WordFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
-
case class
CrossProductFeature
[A, B](labelPart: A, surfacePart: B, id: String = "") extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
CrossProductIndex
[A, B] extends Index[Feature] with Serializable
- Annotations
- @SerialVersionUID()
- case class DepFeature [P](r: Feature) extends LexFeature with Product with Serializable
-
case class
DigitNormalizedFeature
(w: String) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- case class DistFeature (distance: Int, f: Any) extends LexFeature with Product with Serializable
-
class
DistanceBinner
extends Serializable
- Annotations
- @SerialVersionUID()
- case class DistanceFeature (distance: Int, label: String = "Span") extends LexFeature with Product with Serializable
-
case class
FirstWordCapsAnd
(f: Feature) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- class FullWordSpanShapeFeaturizer extends SurfaceFeaturizer[String] with Serializable
-
trait
HackyHeadFinder
[L, T] extends Serializable
HackyHeadFinders find "heads" in a span using only preterminal labels. They do not use the syntactic structure of the sentence.
- class HackyLexicalProductionFeaturizer extends RuleAndSpansFeaturizer[String]
- class HackyLexicalSplitFeaturizer [W] extends SplitSpanFeaturizer[W]
-
class
HashExtendingIndex
[T] extends Index[T] with SerializableLogging
TODO
TODO
- Annotations
- @SerialVersionUID()
- case class HashFeature (hashBucket: Int) extends Feature with Product with Serializable
- case class HeadDepFeature [P](head: Feature, dep: Feature) extends LexFeature with Product with Serializable
- case class HeadFeature [P](r: Feature) extends LexFeature with Product with Serializable
- case class HeadPairDistanceRuleFeature (rule: Int, lsuff: String, rsuff: String, distance: Int) extends Feature with Product with Serializable
-
class
IdentityWordFeaturizer
[W] extends WordFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
- trait IndexBuilder [F] extends AnyRef
- trait IndexedBilexicalFeatureAnchoring [W] extends AnyRef
- trait IndexedBilexicalFeaturizer [W] extends AnyRef
- trait IndexedSplitSpanFeatureAnchoring [W] extends IndexedSurfaceAnchoring[W]
- trait IndexedSplitSpanFeaturizer [W] extends AnyRef
- trait IndexedSurfaceAnchoring [W] extends AnyRef
- trait IndexedSurfaceFeaturizer [W] extends AnyRef
- trait IndexedWordAnchoring [W] extends AnyRef
- trait IndexedWordFeaturizer [W] extends AnyRef
-
case class
IndicatorFeature
(a: Any) extends Feature with CachedHashCode with Product with Serializable
TODO
TODO
- Annotations
- @SerialVersionUID()
-
final
case class
IndicatorWSFeature
(name: Symbol) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
case class
LabelFeature
[L](l: L) extends Feature with CachedHashCode with Product with Serializable
TODO
- case class LeftHeadDistanceRuleFeature (rule: Int, lsuff: String, distance: Int) extends Feature with Product with Serializable
- case class LeftTagDistanceRuleFeature (rule: Int, ltag: String, distance: Int) extends Feature with Product with Serializable
-
final
case class
LeftWordFeature
(str: Any) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- trait LexFeature extends Feature
-
class
LongestFrequentSuffixFeaturizer
extends WordFeaturizer[String] with Serializable
TODO
- class MinimalWordFeaturizer extends WordFeaturizer[String] with Serializable
- class MorphFeaturizer extends WordFeaturizer[String] with Serializable
-
case class
MultiSurfaceFeaturizer
[W](feats: IndexedSeq[SurfaceFeaturizer[W]]) extends SurfaceFeaturizer[W] with Serializable with Product
- Annotations
- @SerialVersionUID()
-
case class
MultiWordFeaturizer
[W](featurizers: IndexedSeq[WordFeaturizer[W]]) extends WordFeaturizer[W] with Serializable with Product
- Annotations
- @SerialVersionUID()
- case class NGramBigramFeature (idx: Int) extends Feature with Product with Serializable
- case class NGramFeature (n: Int, idx: Int) extends Feature with Product with Serializable
-
class
NGramSpanFeaturizer
extends SurfaceFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
- case class NGramUnigramFeature (idx: Int) extends Feature with Product with Serializable
- class NGramWordFeaturizer [W] extends WordFeaturizer[W]
- class NextActualWordFeaturizer extends WordFeaturizer[String] with Serializable
-
class
NonRedundantIndexBuilder
[F] extends IndexBuilder[F]
TODO
-
class
NormalIndexBuilder
[F] extends IndexBuilder[F]
TODO
- case class NotFeature (idx: Int) extends Feature with Product with Serializable
-
case class
NthWordCapsAnd
(f: Feature) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
case class
OffsetFeature
(offset: Int, feature: Feature) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
OffsetWordFeaturizer
[W] extends WordFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
- case class OrientedNGramFeature (offset: Int, features: IndexedSeq[Feature]) extends Feature with CachedHashCode with Product with Serializable
-
class
PorterStemmer
extends (String) ⇒ String
Converts words to their stemmed form using the classic Porter stemming algorithm.
-
final
case class
PrefixFeature
(str: String) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
ProductIndexedBilexicalFeaturizer
[W] extends IndexedBilexicalFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
-
class
ProductSurfaceFeaturizer
[W] extends SurfaceFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
-
class
ProductWordFeaturizer
[W] extends WordFeaturizer[W] with Serializable
- Annotations
- @SerialVersionUID()
- case class PunctuationFeature (f: Feature, dir: Symbol) extends Feature with Product with Serializable
- case class RightHeadDistanceRuleFeature (rule: Int, rsuff: String, distance: Int) extends Feature with Product with Serializable
- case class RightTagDistanceRuleFeature (rule: Int, rtag: String, distance: Int) extends Feature with Product with Serializable
-
final
case class
RightWordFeature
(str: Any) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- trait RuleAndSpansFeaturizer [W] extends Serializable
- case class RuleBasedHackyHeadFinder () extends HackyHeadFinder[String, String] with Product with Serializable
-
final
case class
SeenWithTagFeature
(str: Any) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
SegmentedIndex
[T, IndexType] extends Index[Feature]
- Annotations
- @SerialVersionUID()
-
case class
SentenceLengthFeature
(length: Int) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
SentencePropertiesFeaturizer
extends WordFeaturizer[String] with SurfaceFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
-
final
case class
ShapeFeature
(str: String) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
final
case class
SignatureFeature
(str: String) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- case class SpanEdgeFeature (mp1: MarkerPos, mp2: MarkerPos, f1: Feature, f2: Feature) extends Feature with Product with Serializable
- trait SpanFeature extends Feature
-
case class
SpanLengthFeature
(dist: Int) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
-
class
SpanLengthFeaturizer
extends SurfaceFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
- case class SpanRelativeFeature (f: Feature, mp: MarkerPos) extends Feature with Product with Serializable
- case class SpanShapeFeature (shape: String) extends SpanFeature with Product with Serializable
-
class
SpanShapeFeaturizer
extends SurfaceFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
- class SpanShapeFeaturizerBetter extends SurfaceFeaturizer[String] with Serializable
- case class SplitFeature (x: Feature) extends Feature with Product with Serializable
- trait SplitSpanFeatureAnchoring [W] extends SurfaceFeatureAnchoring[W]
-
trait
SplitSpanFeaturizer
[W] extends SurfaceFeaturizer[W]
TODO
-
final
case class
SuffixFeature
(str: String) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- trait SurfaceFeatureAnchoring [W] extends AnyRef
-
trait
SurfaceFeaturizer
[W] extends Serializable
TODO
-
class
TabulatedIndexedSurfaceAnchoring
[W] extends IndexedSurfaceAnchoring[W] with Serializable
- Annotations
- @SerialVersionUID()
-
class
TabulatedIndexedWordAnchoring
[W] extends IndexedWordAnchoring[W] with Serializable
- Annotations
- @SerialVersionUID()
-
class
TagDictionaryFeaturizer
[L] extends WordFeaturizer[String] with Serializable
TODO
TODO
- Annotations
- @SerialVersionUID()
- case class TagSpanShapeFeature (featType: Int, shape: String) extends SpanFeature with Product with Serializable
-
class
TagSpanShapeFeaturizer
[L] extends SurfaceFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
- case class TransformedFeature (w: Any) extends Feature with Product with Serializable
- class TransformedWordFeaturizer [W] extends WordFeaturizer[W] with Serializable
- class WordClassFeaturizer extends WordFeaturizer[String] with Serializable
-
case class
WordFeature
(word: Any, kind: Symbol) extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- trait WordFeatureAnchoring [W] extends AnyRef
- trait WordFeaturizer [W] extends AnyRef
-
class
WordPrefixFeaturizer
extends WordFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
-
class
WordPropertyFeaturizer
extends WordFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
-
class
WordShapeFeaturizer
extends WordFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
-
class
WordSuffixFeaturizer
extends WordFeaturizer[String] with Serializable
- Annotations
- @SerialVersionUID()
- class ZeroFeaturizer [W] extends WordFeaturizer[W] with SurfaceFeaturizer[W] with Serializable
- class ZeroRuleAndSpansFeaturizer [W] extends RuleAndSpansFeaturizer[W]
Value Members
- def buildNonRedundantFeatureIndex[T, F](it: TraversableOnce[T], gen: (T) ⇒ TraversableOnce[F]): Index[F]
- object AttachLeft extends LexFeature with Product with Serializable
- object AttachRight extends LexFeature with Product with Serializable
- object BeginSentFeature extends Feature with Product with Serializable
- object BilexicalFeaturizer
-
object
BoundaryFeature
extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- object BrownClusters
- object CrossProductIndex extends Serializable
- object DistanceBinner extends Serializable
- object EndSentFeature extends Feature with Product with Serializable
-
object
EnglishWordClassGenerator
extends (String) ⇒ String with Serializable
Converts a string into another string that captures properties of the original string. Useful for rare or zero-count words.
- Annotations
- @SerialVersionUID()
- object HackyHeadFinderTest
- object HackyLexicalProductionFeaturizer extends Serializable
- object HashFeature extends Serializable
-
object
HierarchicalClusters
TODO
- object IndexedBilexicalFeaturizer
- object IndexedSplitSpanFeaturizer
- object IndexedSurfaceFeaturizer
- object IndexedWordFeaturizer
- object LongestFrequentSuffixFeaturizer extends Serializable
- object MorphFeaturizer extends Serializable
- object NGramSpanFeaturizer extends Serializable
-
object
PorterStemmer
extends PorterStemmer
Converts words to their stemmed form using the classic Porter stemming algorithm.
- object RuleAndSpansFeaturizer extends Serializable
- object RuleBasedHackyHeadFinder extends Serializable
- object SegmentedIndex extends Serializable
- object SpanShapeGenerator extends Serializable
- object SplitSpanFeaturizer extends Serializable
-
object
StandardSpanFeatures
extends Serializable
- Annotations
- @SerialVersionUID()
- object SurfaceFeaturizer extends Serializable
- object TagDictionaryFeaturizer extends Serializable
- object TagSpanShapeGenerator extends Serializable
- object WholeSentFeature extends Feature with Product with Serializable
-
object
WholeSentenceIsUpperCaseFeature
extends Feature with Product with Serializable
- Annotations
- @SerialVersionUID()
- object WordFeaturizer
- object WordPropertyFeaturizer extends Serializable
-
object
WordShapeGenerator
extends (String) ⇒ String with Serializable
Generates "word-shapes" that track capitalization patterns and character type patterns.
Generates "word-shapes" that track capitalization patterns and character type patterns. e.g.