|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Objectedu.umass.cs.mallet.base.fst.Transducer
edu.umass.cs.mallet.base.fst.CRF4
Nested Class Summary | |
class |
CRF4.MaximizableCRF
|
static class |
CRF4.State
|
protected static class |
CRF4.TransitionIterator
|
Nested classes inherited from class edu.umass.cs.mallet.base.fst.Transducer |
Transducer.BeamLattice, Transducer.Lattice, Transducer.ViterbiLattice, Transducer.ViterbiPath, Transducer.ViterbiPath_NBest, Transducer.ViterbiPathBeam, Transducer.ViterbiPathBeamB, Transducer.ViterbiPathBeamFB, Transducer.ViterbiPathBeamKL |
Field Summary | |
boolean |
printGradient
|
protected boolean |
someTrainingDone
|
static int |
VITERBI
|
static int |
VITERBI_BBEAM
|
static int |
VITERBI_FBBEAM
|
static int |
VITERBI_FBEAM
|
static int |
VITERBI_FBEAMKL
|
Fields inherited from class edu.umass.cs.mallet.base.fst.Transducer |
INFINITE_COST, inputPipe, outputPipe, ZERO_COST |
Constructor Summary | |
CRF4(Alphabet inputAlphabet,
Alphabet outputAlphabet)
|
|
CRF4(CRF4 other)
Create a CRF whose states and weights are a copy of noes from another CRF. |
|
CRF4(Pipe inputPipe,
Pipe outputPipe)
|
Method Summary | |
void |
addFullyConnectedStates(java.lang.String[] stateNames)
|
void |
addFullyConnectedStatesForBiLabels()
|
void |
addFullyConnectedStatesForLabels()
|
void |
addFullyConnectedStatesForThreeQuarterLabels(InstanceList trainingSet)
|
void |
addFullyConnectedStatesForTriLabels()
|
java.lang.String |
addOrderNStates(InstanceList trainingSet,
int[] orders,
boolean[] defaults,
java.lang.String start,
java.util.regex.Pattern forbidden,
java.util.regex.Pattern allowed,
boolean fullyConnected)
Assumes that the CRF's output alphabet contains String s. |
void |
addSelfTransitioningStateForAllLabels(java.lang.String name)
|
void |
addStartState()
|
void |
addStartState(java.lang.String name)
|
void |
addState(java.lang.String name,
double initialCost,
double finalCost,
java.lang.String[] destinationNames,
java.lang.String[] labelNames)
|
void |
addState(java.lang.String name,
double initialCost,
double finalCost,
java.lang.String[] destinationNames,
java.lang.String[] labelNames,
java.lang.String[] weightNames)
|
void |
addState(java.lang.String name,
double initialCost,
double finalCost,
java.lang.String[] destinationNames,
java.lang.String[] labelNames,
java.lang.String[][] weightNames)
|
void |
addState(java.lang.String name,
java.lang.String[] destinationNames)
|
void |
addStatesForBiLabelsConnectedAsIn(InstanceList trainingSet)
Add states to create a second-order Markov model on labels, adding only those transitions the occur in the given trainingSet. |
void |
addStatesForHalfLabelsConnectedAsIn(InstanceList trainingSet)
Add as many states as there are labels, but don't create separate weights for each source-destination pair of states. |
void |
addStatesForLabelsConnectedAsIn(InstanceList trainingSet)
Add states to create a first-order Markov model on labels, adding only those transitions the occur in the given trainingSet. |
void |
addStatesForThreeQuarterLabelsConnectedAsIn(InstanceList trainingSet)
Add as many states as there are labels, but don't create separate observational-test-weights for each source-destination pair of states---instead have all the incoming transitions to a state share the same observational-feature-test weights. |
void |
estimate()
|
void |
evaluate(TransducerEvaluator eval,
InstanceList testing)
This method is deprecated. |
void |
freezeWeights(int weightsIndex)
Freezes a set of weights to their current values. |
void |
freezeWeights(java.lang.String weightsName)
Freezes a set of weights to their current values. |
double[] |
getDefaultWeights()
|
double |
getGaussianPriorVariance()
|
Alphabet |
getInputAlphabet()
|
CRF4.MaximizableCRF |
getMaximizableCRF(InstanceList ilist)
|
Alphabet |
getOutputAlphabet()
|
double |
getParameter(int sourceStateIndex,
int destStateIndex,
int featureIndex,
double value)
Only gets the parameter from the first group of parameters. |
double |
getParametersAbsNorm()
|
Transducer.State |
getState(int index)
|
CRF4.State |
getState(java.lang.String name)
|
int |
getTransductionType()
|
double |
getUseHyperbolicPriorSharpness()
|
double |
getUseHyperbolicPriorSlope()
|
boolean |
getUseSparseWeights()
|
SparseVector[] |
getWeights()
|
SparseVector |
getWeights(int weightIndex)
|
SparseVector |
getWeights(java.lang.String weightName)
|
int |
getWeightsIndex(java.lang.String weightName)
Increase the size of the weights[] parameters to match (a new, larger) input Alphabet size |
java.lang.String |
getWeightsName(int weightIndex)
|
java.util.Iterator |
initialStateIterator()
|
boolean |
isTrainable()
|
protected CRF4.State |
newState(java.lang.String name,
int index,
double initialCost,
double finalCost,
java.lang.String[] destinationNames,
java.lang.String[] labelNames,
java.lang.String[][] weightNames,
CRF4 crf)
|
int |
numStates()
|
Sequence[] |
predict(InstanceList testing)
This method is deprecated. |
void |
print()
|
void |
print(java.io.PrintWriter out)
|
void |
reset()
|
void |
setAsStartState(CRF4.State state)
|
void |
setDefaultWeight(int widx,
double val)
|
void |
setDefaultWeights(double[] w)
|
void |
setFeatureSelection(int weightIdx,
FeatureSelection fs)
|
void |
setGaussianPriorVariance(double p)
|
void |
setHyperbolicPriorSharpness(double p)
|
void |
setHyperbolicPriorSlope(double p)
|
void |
setParameter(int sourceStateIndex,
int destStateIndex,
int featureIndex,
double value)
Only sets the parameter from the first group of parameters. |
void |
setTrainable(boolean f)
|
void |
setTransductionType(int transductionType)
|
void |
setUseHyperbolicPrior(boolean f)
|
void |
setUseSomeUnsupportedTrick(boolean b)
Sets whether to use the 'some unsupported trick.' This trick is, if training a CRF where some training has been done and sparse weights are used, to add a few weights for feaures that do not occur in the tainig data. |
void |
setUseSparseWeights(boolean b)
|
void |
setWeights(int weightsIndex,
SparseVector transitionWeights)
|
void |
setWeights(SparseVector[] m)
|
void |
setWeights(java.lang.String weightName,
SparseVector transitionWeights)
|
void |
setWeightsDimensionAsIn(InstanceList trainingData)
|
void |
setWeightsDimensionDensely()
|
boolean |
train(InstanceList ilist)
|
boolean |
train(InstanceList ilist,
InstanceList validation,
InstanceList testing)
|
boolean |
train(InstanceList ilist,
InstanceList validation,
InstanceList testing,
TransducerEvaluator eval)
|
boolean |
train(InstanceList ilist,
InstanceList validation,
InstanceList testing,
TransducerEvaluator eval,
int numIterations)
|
boolean |
train(InstanceList training,
InstanceList validation,
InstanceList testing,
TransducerEvaluator eval,
int numIterations,
int numIterationsPerProportion,
double[] trainingProportions)
|
boolean |
trainWithFeatureInduction(InstanceList trainingData,
InstanceList validationData,
InstanceList testingData,
TransducerEvaluator eval,
int numIterations,
int numIterationsBetweenFeatureInductions,
int numFeatureInductions,
int numFeaturesPerFeatureInduction,
double trueLabelProbThreshold,
boolean clusteredFeatureInduction,
double[] trainingProportions)
|
boolean |
trainWithFeatureInduction(InstanceList trainingData,
InstanceList validationData,
InstanceList testingData,
TransducerEvaluator eval,
int numIterations,
int numIterationsBetweenFeatureInductions,
int numFeatureInductions,
int numFeaturesPerFeatureInduction,
double trueLabelProbThreshold,
boolean clusteredFeatureInduction,
double[] trainingProportions,
java.lang.String gainName)
|
Sequence |
transduce(java.lang.Object unpipedInput)
|
Sequence |
transduce(Sequence input)
Converts the given sequence into another sequence according to this transducer. |
void |
unfreezeWeights(java.lang.String weightsName)
Unfreezes a set of weights. |
Transducer.ViterbiPath |
viterbiPath(Sequence inputSequence,
boolean keepLattice)
|
void |
write(java.io.File f)
|
Methods inherited from class java.lang.Object |
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Field Detail |
protected boolean someTrainingDone
public boolean printGradient
public static final int VITERBI
public static final int VITERBI_FBEAM
public static final int VITERBI_BBEAM
public static final int VITERBI_FBBEAM
public static final int VITERBI_FBEAMKL
Constructor Detail |
public CRF4(Pipe inputPipe, Pipe outputPipe)
public CRF4(Alphabet inputAlphabet, Alphabet outputAlphabet)
public CRF4(CRF4 other)
Method Detail |
public Alphabet getInputAlphabet()
public Alphabet getOutputAlphabet()
public void setUseHyperbolicPrior(boolean f)
public void setHyperbolicPriorSlope(double p)
public void setHyperbolicPriorSharpness(double p)
public double getUseHyperbolicPriorSlope()
public double getUseHyperbolicPriorSharpness()
public void setGaussianPriorVariance(double p)
public double getGaussianPriorVariance()
public void setUseSparseWeights(boolean b)
public boolean getUseSparseWeights()
public void setUseSomeUnsupportedTrick(boolean b)
This generally leads to better accuracy at only a small memory cost.
b
- Whether to use the trickpublic int getTransductionType()
public void setTransductionType(int transductionType)
protected CRF4.State newState(java.lang.String name, int index, double initialCost, double finalCost, java.lang.String[] destinationNames, java.lang.String[] labelNames, java.lang.String[][] weightNames, CRF4 crf)
public void addState(java.lang.String name, double initialCost, double finalCost, java.lang.String[] destinationNames, java.lang.String[] labelNames, java.lang.String[][] weightNames)
public void addState(java.lang.String name, double initialCost, double finalCost, java.lang.String[] destinationNames, java.lang.String[] labelNames, java.lang.String[] weightNames)
public void addState(java.lang.String name, double initialCost, double finalCost, java.lang.String[] destinationNames, java.lang.String[] labelNames)
public void addState(java.lang.String name, java.lang.String[] destinationNames)
public void addFullyConnectedStates(java.lang.String[] stateNames)
public void addFullyConnectedStatesForLabels()
public void addStartState()
public void addStartState(java.lang.String name)
public void setAsStartState(CRF4.State state)
public void addStatesForLabelsConnectedAsIn(InstanceList trainingSet)
public void addStatesForHalfLabelsConnectedAsIn(InstanceList trainingSet)
public void addStatesForThreeQuarterLabelsConnectedAsIn(InstanceList trainingSet)
public void addFullyConnectedStatesForThreeQuarterLabels(InstanceList trainingSet)
public void addFullyConnectedStatesForBiLabels()
public void addStatesForBiLabelsConnectedAsIn(InstanceList trainingSet)
public void addFullyConnectedStatesForTriLabels()
public void addSelfTransitioningStateForAllLabels(java.lang.String name)
public java.lang.String addOrderNStates(InstanceList trainingSet, int[] orders, boolean[] defaults, java.lang.String start, java.util.regex.Pattern forbidden, java.util.regex.Pattern allowed, boolean fullyConnected)
String
s. Creates an order-n CRF with input
predicates and output labels given by trainingSet
and order, connectivity, and weights given by the remaining
arguments.
trainingSet
- the training instancesorders
- an array of increasing non-negative numbers giving
the orders of the features for this CRF. The largest number
n is the Markov order of the CRF. States are
n-tuples of output labels. Each of the other numbers
k in orders
represents a weight set shared
by all destination states whose last (most recent) k
labels agree. If orders
is null
, an
order-0 CRF is built.defaults
- If non-null, it must be the same length as
orders
, with true
positions indicating
that the weight set for the corresponding order contains only the
weight for a default feature; otherwise, the weight set has
weights for all features built from input predicates.start
- The label that represents the context of the start of
a sequence. It may be also used for sequence labels. If no label of
this name exists, one will be added. Connection wills be added between
the start label and all other labels, even if fullyConnected is
false. This argument may be null, in which case no special
start state is added.forbidden
- If non-null, specifies what pairs of successive
labels are not allowed, both for constructing norder
states or for transitions. A label pair (u,v)
is not allowed if u + "," + v matches
forbidden
.allowed
- If non-null, specifies what pairs of successive
labels are allowed, both for constructing norder
states or for transitions. A label pair (u,v)
is allowed only if u + "," + v matches
allowed
.fullyConnected
- Whether to include all allowed transitions,
even those not occurring in trainingSet
,
public CRF4.State getState(java.lang.String name)
public void setWeights(int weightsIndex, SparseVector transitionWeights)
public void setWeights(java.lang.String weightName, SparseVector transitionWeights)
public java.lang.String getWeightsName(int weightIndex)
public SparseVector getWeights(java.lang.String weightName)
public SparseVector getWeights(int weightIndex)
public double[] getDefaultWeights()
public SparseVector[] getWeights()
public void setWeights(SparseVector[] m)
public void setDefaultWeights(double[] w)
public void setDefaultWeight(int widx, double val)
public void freezeWeights(int weightsIndex)
weightsIndex
- Index of weight set to freeze.public void freezeWeights(java.lang.String weightsName)
weightsName
- Name of weight set to freeze.public void unfreezeWeights(java.lang.String weightsName)
weightsName
- Name of weight set to unfreeze.public void setFeatureSelection(int weightIdx, FeatureSelection fs)
public void setWeightsDimensionAsIn(InstanceList trainingData)
public void setWeightsDimensionDensely()
public int getWeightsIndex(java.lang.String weightName)
public int numStates()
numStates
in class Transducer
public Transducer.State getState(int index)
getState
in class Transducer
public java.util.Iterator initialStateIterator()
initialStateIterator
in class Transducer
public boolean isTrainable()
isTrainable
in class Transducer
public void setTrainable(boolean f)
setTrainable
in class Transducer
public double getParametersAbsNorm()
public void setParameter(int sourceStateIndex, int destStateIndex, int featureIndex, double value)
public double getParameter(int sourceStateIndex, int destStateIndex, int featureIndex, double value)
public void reset()
public void estimate()
public Sequence transduce(java.lang.Object unpipedInput)
public Sequence transduce(Sequence input)
Transducer
transduce
in class Transducer
input
- Input sequence
public void print()
print
in class Transducer
public void print(java.io.PrintWriter out)
public boolean train(InstanceList ilist)
train
in class Transducer
public boolean train(InstanceList ilist, InstanceList validation, InstanceList testing)
public boolean train(InstanceList ilist, InstanceList validation, InstanceList testing, TransducerEvaluator eval)
public boolean train(InstanceList ilist, InstanceList validation, InstanceList testing, TransducerEvaluator eval, int numIterations)
public boolean train(InstanceList training, InstanceList validation, InstanceList testing, TransducerEvaluator eval, int numIterations, int numIterationsPerProportion, double[] trainingProportions)
public boolean trainWithFeatureInduction(InstanceList trainingData, InstanceList validationData, InstanceList testingData, TransducerEvaluator eval, int numIterations, int numIterationsBetweenFeatureInductions, int numFeatureInductions, int numFeaturesPerFeatureInduction, double trueLabelProbThreshold, boolean clusteredFeatureInduction, double[] trainingProportions)
public boolean trainWithFeatureInduction(InstanceList trainingData, InstanceList validationData, InstanceList testingData, TransducerEvaluator eval, int numIterations, int numIterationsBetweenFeatureInductions, int numFeatureInductions, int numFeaturesPerFeatureInduction, double trueLabelProbThreshold, boolean clusteredFeatureInduction, double[] trainingProportions, java.lang.String gainName)
public Sequence[] predict(InstanceList testing)
public void evaluate(TransducerEvaluator eval, InstanceList testing)
public void write(java.io.File f)
public CRF4.MaximizableCRF getMaximizableCRF(InstanceList ilist)
public Transducer.ViterbiPath viterbiPath(Sequence inputSequence, boolean keepLattice)
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |