islex package

Submodules

islex.load module

class islex.load.CaseInsensitiveMapping(backing_store)[source]

Bases: islex.load.ReadOnlyMapping

class islex.load.ReadOnlyMapping(backing_store)[source]

Bases: _abcoll.Mapping

islex.load.ortho_mapping(module)[source]
islex.load.stream_from_fh(fh, clean=False)[source]
islex.load.write_package_data()[source]

islex.tokens module

class islex.tokens.EntityCategory[source]

Bases: enum.Enum

BOYNAME = <EntityCategory.BOYNAME: 13>
CITY = <EntityCategory.CITY: 2>
COMPANY = <EntityCategory.COMPANY: 9>
CONTINENT = <EntityCategory.CONTINENT: 6>
COUNTRY = <EntityCategory.COUNTRY: 5>
EVENT = <EntityCategory.EVENT: 4>
GIRLNAME = <EntityCategory.GIRLNAME: 14>
MONTH = <EntityCategory.MONTH: 12>
ORGANIZATION = <EntityCategory.ORGANIZATION: 8>
PERSON = <EntityCategory.PERSON: 7>
PLACE = <EntityCategory.PLACE: 10>
PRODUCT = <EntityCategory.PRODUCT: 1>
STATE = <EntityCategory.STATE: 11>
SURNAME = <EntityCategory.SURNAME: 3>
UNSPECIFIED_ENTITY = <EntityCategory.UNSPECIFIED_ENTITY: 0>
class islex.tokens.Morph(emes)[source]

Bases: object

Contains a morphological analysis of the corresponding orthographic form (ortho).

A word may have more than one morphological analysis, e.g. axes -> (ax + s), (axe + s)

emes = Attribute(name='emes', default=NOTHING, validator=<instance_of validator for type <type 'tuple'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
classmethod from_string(s)[source]
to_string()[source]
class islex.tokens.Phone(value=<instance_of validator for type <type 'unicode'>>)[source]

Bases: object

Contains a cluster of IPA characters representing a single phone (or phoneme).

value = Attribute(name='value', default=<instance_of validator for type <type 'unicode'>>, validator=None, repr=True, cmp=True, hash=True, init=True, convert=None)
class islex.tokens.Pos(category, entity_type=None)[source]

Bases: object

Contains part-of-speech information and, optionally, an entity category.

category = Attribute(name='category', default=NOTHING, validator=<instance_of validator for type <enum 'PosCategory'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
entity_type = Attribute(name='entity_type', default=None, validator=<optional validator for <instance_of validator for type <enum 'EntityCategory'>> or None>, repr=True, cmp=True, hash=True, init=True, convert=None)
classmethod from_string(t)[source]
to_string()[source]
class islex.tokens.PosCategory[source]

Bases: enum.Enum

Enumeration of possible POS tags.

ABBREVIATION = <PosCategory.ABBREVIATION: 80>
CC = <PosCategory.CC: 58>
CD = <PosCategory.CD: 52>
DT = <PosCategory.DT: 50>
EX = <PosCategory.EX: 51>
FW = <PosCategory.FW: 21>
IN = <PosCategory.IN: 54>
JJ = <PosCategory.JJ: 6>
JJR = <PosCategory.JJR: 7>
JJS = <PosCategory.JJS: 8>
LS = <PosCategory.LS: 20>
MD = <PosCategory.MD: 53>
NN = <PosCategory.NN: 4>
NNP = <PosCategory.NNP: 15>
NNPS = <PosCategory.NNPS: 16>
NNS = <PosCategory.NNS: 5>
OF = <PosCategory.OF: 56>
PDT = <PosCategory.PDT: 59>
PRP = <PosCategory.PRP: 57>
PUNC = <PosCategory.PUNC: 82>
RB = <PosCategory.RB: 1>
RBR = <PosCategory.RBR: 2>
RBS = <PosCategory.RBS: 3>
RP = <PosCategory.RP: 63>
SYM = <PosCategory.SYM: 81>
TO = <PosCategory.TO: 55>
UH = <PosCategory.UH: 22>
UNUSED_POSTAG = <PosCategory.UNUSED_POSTAG: 0>
VB = <PosCategory.VB: 9>
VBD = <PosCategory.VBD: 10>
VBG = <PosCategory.VBG: 11>
VBN = <PosCategory.VBN: 13>
VBP = <PosCategory.VBP: 12>
VBZ = <PosCategory.VBZ: 14>
WDT = <PosCategory.WDT: 61>
WP = <PosCategory.WP: 62>
WRB = <PosCategory.WRB: 60>
class islex.tokens.Pron(sylls)[source]

Bases: object

classmethod from_string(s, clean=False)[source]
ipa
sylls = Attribute(name='sylls', default=NOTHING, validator=<instance_of validator for type <type 'tuple'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
to_string()[source]
class islex.tokens.Syllable(phones=<instance_of validator for type <type 'tuple'>>)[source]

Bases: object

classmethod from_string(s)[source]
ipa
phones = Attribute(name='phones', default=<instance_of validator for type <type 'tuple'>>, validator=None, repr=True, cmp=True, hash=True, init=True, convert=None)
to_string()[source]
class islex.tokens.Word(ortho, pos, morphs, prons)[source]

Bases: object

classmethod from_string(s, clean=False)[source]
ipa
morphs = Attribute(name='morphs', default=NOTHING, validator=<instance_of validator for type <type 'tuple'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
ortho = Attribute(name='ortho', default=NOTHING, validator=None, repr=True, cmp=True, hash=True, init=True, convert=None)
ortho_patt = <_sre.SRE_Pattern object>
pos = Attribute(name='pos', default=NOTHING, validator=<instance_of validator for type <type 'tuple'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
prons = Attribute(name='prons', default=NOTHING, validator=<instance_of validator for type <type 'tuple'>>, repr=True, cmp=True, hash=True, init=True, convert=None)
to_string()[source]

Module contents