ConllChainNer

NER tagger for the CoNLL 2003 corpus

Training time: ~3 minutes (on blake, 30 Oct. 4:00pm); tokens per second: 8431.02310444517; docs per second: 48.24287793720109 (avg doc length = 200 tokens).

CoNLL 2003 dev set (eng.testa):
OVERALL f1=0.933593 p=0.939802 r=0.927465 (tp=5511 fp=353 fn=431 true=5942 pred=5864) acc=0.985865 (50636/51362)
LOC f1=0.965931 p=0.967249 r=0.964616 (tp=1772 fp=60 fn=65 true=1837 pred=1832)
MISC f1=0.876404 p=0.909091 r=0.845987 (tp=780 fp=78 fn=142 true=922 pred=858)
ORG f1=0.892065 p=0.899848 r=0.884415 (tp=1186 fp=132 fn=155 true=1341 pred=1318)
PER f1=0.958897 p=0.955280 r=0.962541 (tp=1773 fp=83 fn=69 true=1842 pred=1856)

CoNLL 2003 test set (eng.testb):
OVERALL f1=0.885633 p=0.888315 r=0.882967 (tp=4987 fp=627 fn=661 true=5648 pred=5614) acc=0.973253 (45193/46435)
LOC f1=0.915375 p=0.909953 r=0.920863 (tp=1536 fp=152 fn=132 true=1668 pred=1688)
MISC f1=0.791034 p=0.803231 r=0.779202 (tp=547 fp=134 fn=155 true=702 pred=681)
ORG f1=0.842767 p=0.838498 r=0.847080 (tp=1407 fp=271 fn=254 true=1661 pred=1678)
PER f1=0.940327 p=0.955329 r=0.925788 (tp=1497 fp=70 fn=120 true=1617 pred=1567)

Linear Supertypes

ChainNer[BilouConllNerTag], DocumentAnnotator, AnyRef, Any

Known Subclasses

ConllChainNer

Instance Constructors

new ConllChainNer(url: URL = null)

Type Members

class ChainNERFeatures extends BinaryFeatureVectorVariable[String]

Definition Classes
ChainNer
class ChainNERModel[Features <: CategoricalVectorVar[String]] extends ChainModel[L, Features, Token]

Definition Classes
ChainNer

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
object ChainNERFeaturesDomain extends CategoricalVectorDomain[String]

Definition Classes
ChainNer
object Demonyms extends PhraseLexicon

Definition Classes
ChainNer
def addFeatures(document: Document, vf: (Token) ⇒ CategoricalVectorVar[String]): Unit

Definition Classes
ChainNer
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
val clusters: Map[String, String]

Definition Classes
ChainNer
def deserialize(stream: InputStream): Unit

Definition Classes
ChainNer
def documentAnnotationString(document: Document): String

How the annotation of this DocumentAnnotator should be printed as extra information after a one-word-per-line (OWPL) format. If there is no document annotation, return the empty string. Used in Document.owplString.

Definition Classes
DocumentAnnotator
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def evaluationString(documents: Iterable[Document]): Double

Definition Classes
ChainNer
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def loadDocs(fileName: String): Seq[Document]
def mentionAnnotationString(mention: Mention): String

Definition Classes
DocumentAnnotator
val model: ChainNERModel[ChainNERFeatures]

Definition Classes
ChainNer
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
val objective: HammingObjective.type

Definition Classes
ChainNer
def phraseAnnotationString(phrase: Phrase): String

Definition Classes
DocumentAnnotator
def postAttrs: Seq[Class[_]]

Definition Classes
ChainNer → DocumentAnnotator
def prefix(prefixSize: Int, cluster: String): String

Definition Classes
ChainNer
def prereqAttrs: Seq[Class[Sentence]]

Definition Classes
ChainNer → DocumentAnnotator
def printEvaluation(trainDocs: Iterable[Document], testDocs: Iterable[Document], iteration: String): Double

Definition Classes
ChainNer
def process(document: Document): Document

Definition Classes
ConllChainNer → ChainNer → DocumentAnnotator
def processParallel(documents: Iterable[Document], nThreads: Int = ...): Iterable[Document]

Definition Classes
DocumentAnnotator
def processSequential(documents: Iterable[Document]): Iterable[Document]

Definition Classes
DocumentAnnotator
def sampleOutputString(tokens: Iterable[Token]): String

Definition Classes
ChainNer
def serialize(stream: OutputStream): Unit

Definition Classes
ChainNer
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
def tokenAnnotationString(token: Token): String

How the annotation of this DocumentAnnotator should be printed in one-word-per-line (OWPL) format. If there is no per-token annotation, return null. Used in Document.owplString.

Definition Classes
ChainNer → DocumentAnnotator
def train(trainDocs: Seq[Document], testDocs: Seq[Document], rate: Double = 0.18, delta: Double = 0.066)(implicit random: Random): Double

Definition Classes
ChainNer
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

class ConllChainNer extends ChainNer[BilouConllNerTag]

Instance Constructors

new ConllChainNer(url: URL = null)

Type Members

class ChainNERFeatures extends BinaryFeatureVectorVariable[String]

class ChainNERModel[Features <: CategoricalVectorVar[String]] extends ChainModel[L, Features, Token]

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

object ChainNERFeaturesDomain extends CategoricalVectorDomain[String]

object Demonyms extends PhraseLexicon

def addFeatures(document: Document, vf: (Token) ⇒ CategoricalVectorVar[String]): Unit

final def asInstanceOf[T0]: T0

def clone(): AnyRef

val clusters: Map[String, String]

def deserialize(stream: InputStream): Unit

def documentAnnotationString(document: Document): String

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def evaluationString(documents: Iterable[Document]): Double

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

def loadDocs(fileName: String): Seq[Document]

def mentionAnnotationString(mention: Mention): String

val model: ChainNERModel[ChainNERFeatures]

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

val objective: HammingObjective.type

def phraseAnnotationString(phrase: Phrase): String

def postAttrs: Seq[Class[_]]

def prefix(prefixSize: Int, cluster: String): String

def prereqAttrs: Seq[Class[Sentence]]

def printEvaluation(trainDocs: Iterable[Document], testDocs: Iterable[Document], iteration: String): Double

def process(document: Document): Document

def processParallel(documents: Iterable[Document], nThreads: Int = ...): Iterable[Document]

def processSequential(documents: Iterable[Document]): Iterable[Document]

def sampleOutputString(tokens: Iterable[Token]): String

def serialize(stream: OutputStream): Unit

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

def tokenAnnotationString(token: Token): String

def train(trainDocs: Seq[Document], testDocs: Seq[Document], rate: Double = 0.18, delta: Double = 0.066)(implicit random: Random): Double

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from ChainNer[BilouConllNerTag]

Inherited from DocumentAnnotator

Inherited from AnyRef

Inherited from Any

Ungrouped