Acoustic Model Discussions

Flat
Problems with Voxforge Acoustic Model
User: e.fields
Date: 12/15/2012 12:33 pm
Views: 13364
Rating: 13

I've downloaded the Spanish Voxforge Acoustic Model and I'm trying to use it with the test language model that came with it. However, I keep receiving the following errors:

12:27:52.901 SEVERE lexTreeLinguist Bad HMM Unit: V

12:27:52.909 SEVERE HMMTree Missing HMM for unit E with lc=V rc=R

12:27:52.909 SEVERE lexTreeLinguist Bad HMM Unit: V

12:27:52.909 SEVERE HMMTree Missing HMM for unit N with lc=O rc=V

12:27:52.909 SEVERE lexTreeLinguist Bad HMM Unit: V

12:27:52.909 SEVERE HMMTree Missing HMM for unit V with lc=N rc=E

 

 

I receive dozens of errors like this. Is the problem with my config.xml file? I've pasted it below for viewing:

 

<?xml version="1.0" encoding="UTF-8"?>

<!-- ************************************************** -->
<!-- Sphinx-4 Configuration File                        -->
<!-- ************************************************** -->


<config>
    
    <!-- ************************************************** -->
    <!-- Global Properties                                  -->
    <!-- ************************************************** -->
    
    <!-- Beam widths referenced by the unitExitActiveList and activeList factories -->
    <property name="absoluteBeamWidth" value="5000"/>
    <property name="relativeBeamWidth" value="1E-120"/>

    <!-- Beam widths referenced by the wordActiveList factory -->
    <property name="absoluteWordBeamWidth" value="200"/>
    <property name="relativeWordBeamWidth" value="1E-80"/>

    <!-- Weight and insertion probabilities referenced by lexTreeLinguist -->
    <property name="languageWeight" value="10.5"/>
    <property name="wordInsertionProbability" value="0.7"/>
    <property name="silenceInsertionProbability" value=".1"/>
    <property name="fillerInsertionProbability" value="1e-6"/>

    <!-- Look-ahead settings referenced by wordPruningSearchManager -->
    <property name="acousticLookahead" value="1.7"/>
    <property name="lookaheadBeam" value="1e-80"/>

    <!-- Component names substituted wherever ${frontend} and ${recognizer} appear -->
    <property name="frontend" value="mfcFrontEnd"/>
    <property name="recognizer" value="recognizer"/>
    
    <!-- ************************************************** -->
    <!-- Components                                         -->
    <!-- ************************************************** -->
    
    <!-- BatchModeRecognizer component; it uses the component named by ${recognizer}.
         NOTE(review): the inputDataProcessors list names "streamDataSource", but no
         component with that name is defined in this configuration (the front-end
         pipeline starts with audioFileDataSource). Confirm before using this component. -->
    <component name="batch"
        type="edu.cmu.sphinx.tools.batch.BatchModeRecognizer">
        <propertylist name="inputDataProcessors">
            <item>streamDataSource</item>
        </propertylist>
        <property name="skip" value="0"/>
        <property name="recognizer" value="${recognizer}"/>
    </component>
    
    <!-- Recognizer: delegates to the "decoder" component and attaches three monitors. -->
    <component name="recognizer" type="edu.cmu.sphinx.recognizer.Recognizer">
        <property name="decoder" value="decoder"/>
        <propertylist name="monitors">
            <item>accuracyTracker</item>
            <item>speedTracker</item>
            <item>memoryTracker</item>
        </propertylist>
    </component>
    
    <!-- Decoder: its search manager is wordPruningSearchManager. -->
    <component name="decoder" type="edu.cmu.sphinx.decoder.Decoder">
        <property name="searchManager" value="wordPruningSearchManager"/>
    </component>
    
    <!-- Search manager (WordPruningBreadthFirstSearchManager) wired to lexTreeLinguist. -->
    <component name="wordPruningSearchManager" type="edu.cmu.sphinx.decoder.search.WordPruningBreadthFirstSearchManager">
        <!-- Collaborating components -->
        <property name="logMath" value="logMath"/>
        <property name="linguist" value="lexTreeLinguist"/>
        <property name="scorer" value="threadedScorer"/>
        <property name="pruner" value="trivialPruner"/>
        <property name="activeListManager" value="activeListManager"/>

        <!-- Search flags -->
        <property name="buildWordLattice" value="false"/>
        <property name="checkStateOrder" value="false"/>
        <property name="growSkipInterval" value="0"/>

        <!-- Look-ahead settings. Note that relativeBeamWidth is bound to
             ${lookaheadBeam} here, not to the global ${relativeBeamWidth}. -->
        <property name="acousticLookaheadFrames" value="${acousticLookahead}"/>
        <property name="relativeBeamWidth" value="${lookaheadBeam}"/>
    </component>
    
    <!-- Active list manager holding six factory entries; wordActiveList appears
         twice and activeList three times.
         NOTE(review): the list looks positional (presumably one entry per search
         state type, in the linguist's state order). Confirm before reordering or
         removing the repeated entries. -->
    <component name="activeListManager"
        type="edu.cmu.sphinx.decoder.search.SimpleActiveListManager">
        <propertylist name="activeListFactories">
            <item>unitExitActiveList</item>
            <item>wordActiveList</item>
            <item>wordActiveList</item>
            <item>activeList</item>
            <item>activeList</item>
            <item>activeList</item>
        </propertylist>
    </component>
    
    <!-- Active list factory using the general beam widths. -->
    <component name="unitExitActiveList" type="edu.cmu.sphinx.decoder.search.PartitionActiveListFactory">
        <property name="absoluteBeamWidth" value="${absoluteBeamWidth}"/>
        <property name="relativeBeamWidth" value="${relativeBeamWidth}"/>
        <property name="logMath" value="logMath"/>
    </component>
    
    <!-- Active list factory using the word-specific beam widths. -->
    <component name="wordActiveList" type="edu.cmu.sphinx.decoder.search.PartitionActiveListFactory">
        <property name="absoluteBeamWidth" value="${absoluteWordBeamWidth}"/>
        <property name="relativeBeamWidth" value="${relativeWordBeamWidth}"/>
        <property name="logMath" value="logMath"/>
    </component>
    
    <!-- Active list factory using the general beam widths
         (same settings as unitExitActiveList). -->
    <component name="activeList" type="edu.cmu.sphinx.decoder.search.PartitionActiveListFactory">
        <property name="absoluteBeamWidth" value="${absoluteBeamWidth}"/>
        <property name="relativeBeamWidth" value="${relativeBeamWidth}"/>
        <property name="logMath" value="logMath"/>
    </component>
    
    <!-- LexTreeLinguist: ties together the dictionary, the "voxforge" acoustic
         model and the "trigramModel" language model. -->
    <component name="lexTreeLinguist" type="edu.cmu.sphinx.linguist.lextree.LexTreeLinguist">
        <!-- Collaborating components -->
        <property name="logMath" value="logMath"/>
        <property name="unitManager" value="unitManager"/>
        <property name="dictionary" value="dictionary"/>
        <property name="acousticModel" value="voxforge"/>
        <property name="languageModel" value="trigramModel"/>

        <!-- Values taken from the global properties of the same name -->
        <property name="languageWeight" value="${languageWeight}"/>
        <property name="wordInsertionProbability" value="${wordInsertionProbability}"/>
        <property name="silenceInsertionProbability" value="${silenceInsertionProbability}"/>
        <property name="fillerInsertionProbability" value="${fillerInsertionProbability}"/>

        <!-- Settings fixed in this component -->
        <property name="addFillerWords" value="false"/>
        <property name="wantUnigramSmear" value="true"/>
        <property name="unigramSmearWeight" value="1"/>
        <property name="cacheSize" value="0"/>
    </component>
    
    <!-- N-gram language model loaded from the test LM shipped with the model.
         NOTE(review): maxDepth is 2 although the component is named trigramModel;
         confirm that this is intended. -->
    <component name="trigramModel" type="edu.cmu.sphinx.linguist.language.ngram.SimpleNGramModel">
        <property name="location" value="/Users/Eric/Documents/Research/Sphinx4/bld/voxforge-es-0.1.1/etc/voxforge_es_sphinx.transcription.test.lm"/>
        <property name="dictionary" value="dictionary"/>
        <property name="logMath" value="logMath"/>
        <property name="maxDepth" value="2"/>
        <property name="unigramWeight" value=".7"/>
    </component>
    
    <!-- Pronunciation dictionary and filler list, both read from absolute paths.
         NOTE(review): the log quoted above this configuration reports
         "Bad HMM Unit: V" and missing HMMs with V as a context. That suggests the
         pronunciations loaded here use a phone V that the acoustic model does not
         contain. Check that the phone set of this _MX dictionary matches the
         phone set of the model configured in modelLoader. -->
    <component name="dictionary"
        type="edu.cmu.sphinx.linguist.dictionary.FullDictionary">
        <property name="dictionaryPath" value="/Users/Eric/Documents/Research/Sphinx4/bld/voxforge-es-0.1.1/etc/voxforge_es_sphinx_MX.dic"/>
        <property name="fillerPath" value="/Users/Eric/Documents/Research/Sphinx4/bld/voxforge-es-0.1.1/etc/voxforge_es_sphinx.filler"/>
        <property name="unitManager" value="unitManager"/>
    </component>
    
    <!-- Acoustic model; its data is supplied by the modelLoader component. -->
    <component name="voxforge" type="edu.cmu.sphinx.linguist.acoustic.tiedstate.TiedStateAcousticModel">
        <property name="unitManager" value="unitManager"/>
        <property name="loader" value="modelLoader"/>
    </component>
    
    <!-- Loader for the acoustic model files; also referenced by featureTransform.
         The location is an absolute path on the author's machine. -->
    <component name="modelLoader"
        type="edu.cmu.sphinx.linguist.acoustic.tiedstate.Sphinx3Loader">
        <property name="location" value="/Users/Eric/Documents/Research/Sphinx4/bld/voxforge-es-0.1.1/model_parameters/voxforge_es_sphinx.cd_cont_1500"/>
        <property name="vectorLength" value="29"/>
        <property name="unitManager" value="unitManager"/>
        <property name="logMath" value="logMath"/>
    </component>
    
    <!-- Pruner used by wordPruningSearchManager; no properties are set. -->
    <component name="trivialPruner" type="edu.cmu.sphinx.decoder.pruner.SimplePruner"/>
    
    <!-- Acoustic scorer; reads features from the component named by ${frontend}. -->
    <component name="threadedScorer" type="edu.cmu.sphinx.decoder.scorer.ThreadedAcousticScorer">
        <property name="frontend" value="${frontend}"/>
    </component>
    
    <!-- Shared LogMath instance referenced by the search, linguist and loader components. -->
    <component name="logMath" type="edu.cmu.sphinx.util.LogMath">
        <property name="useAddTable" value="true"/>
        <property name="logBase" value="1.0001"/>
    </component>
    
    <!-- Shared UnitManager referenced by the linguist, dictionary, acoustic model and loader. -->
    <component name="unitManager" type="edu.cmu.sphinx.linguist.acoustic.UnitManager"/>
    
    <!-- Front-end pipeline, selected through the global "frontend" property.
         The item order is kept exactly as written; the processors are presumably
         applied in list order, so do not reorder without checking.
         Item names are written without surrounding whitespace so that each one
         matches its component name exactly instead of relying on the loader to
         trim the text. -->
    <component name="mfcFrontEnd"
        type="edu.cmu.sphinx.frontend.FrontEnd">
        <propertylist name="pipeline">
            <item>audioFileDataSource</item>
            <item>dataBlocker</item>
            <item>speechClassifier</item>
            <item>speechMarker</item>
            <item>nonSpeechDataFilter</item>
            <item>dither</item>
            <item>preemphasizer</item>
            <item>windower</item>
            <item>fft</item>
            <item>melFilterBank</item>
            <item>dct</item>
            <item>liveCMN</item>
            <item>featureExtraction</item>
            <item>featureTransform</item>
        </propertylist>
    </component>
    
    <!-- First two pipeline stages of mfcFrontEnd; neither sets any property. -->
    <component name="audioFileDataSource"
        type="edu.cmu.sphinx.frontend.util.AudioFileDataSource"/>

    <component name="dataBlocker"
        type="edu.cmu.sphinx.frontend.DataBlocker"/>
    
    <!-- Microphone input source. It is defined here but not listed in the
         mfcFrontEnd pipeline, which reads from audioFileDataSource. -->
    <component name="microphone" type="edu.cmu.sphinx.frontend.util.Microphone">
        <property name="closeBetweenUtterances" value="false"/>
    </component>
    
    <!-- Endpointing stage: speech classifier with its threshold set to 13. -->
    <component name="speechClassifier" type="edu.cmu.sphinx.frontend.endpoint.SpeechClassifier">
        <property name="threshold" value="13"/>
    </component>
    
    <!-- Endpointing stage: non-speech data filter; no properties are set. -->
    <component name="nonSpeechDataFilter" type="edu.cmu.sphinx.frontend.endpoint.NonSpeechDataFilter"/>
    
    <!-- Endpointing stage: speech marker with speechTrailer set to 50. -->
    <component name="speechMarker" type="edu.cmu.sphinx.frontend.endpoint.SpeechMarker">
        <property name="speechTrailer" value="50"/>
    </component>

    
    <!-- Signal-processing stages that set no properties. The order of these
         definitions is not the pipeline order; that is given by mfcFrontEnd. -->
    <component name="preemphasizer" type="edu.cmu.sphinx.frontend.filter.Preemphasizer"/>

    <component name="dither" type="edu.cmu.sphinx.frontend.filter.Dither"/>

    <component name="windower" type="edu.cmu.sphinx.frontend.window.RaisedCosineWindower"/>

    <component name="fft" type="edu.cmu.sphinx.frontend.transform.DiscreteFourierTransform"/>
    
    <!-- Mel filter bank: 32 filters between minimumFrequency 200 and maximumFrequency 3500. -->
    <component name="melFilterBank" type="edu.cmu.sphinx.frontend.frequencywarp.MelFrequencyFilterBank">
        <property name="minimumFrequency" value="200"/>
        <property name="maximumFrequency" value="3500"/>
        <property name="numberFilters" value="32"/>
    </component>
    
    <!-- Discrete cosine transform stage; no properties are set. -->
    <component name="dct" type="edu.cmu.sphinx.frontend.transform.DiscreteCosineTransform"/>
    
    <!-- LiveCMN stage; no properties are set. -->
    <component name="liveCMN" type="edu.cmu.sphinx.frontend.feature.LiveCMN"/>
    
    <!-- Deltas feature extractor stage; no properties are set. -->
    <component name="featureExtraction" type="edu.cmu.sphinx.frontend.feature.DeltasFeatureExtractor"/>
    
    <!-- Last pipeline stage; it uses the same modelLoader as the acoustic model. -->
    <component name="featureTransform" type="edu.cmu.sphinx.frontend.feature.FeatureTransform">
        <property name="loader" value="modelLoader"/>
    </component>
    
    <!-- ************************************************** -->
    <!-- Instrumentation                                    -->
    <!-- ************************************************** -->
    
    <!-- Accuracy monitor attached to ${recognizer}; raw and aligned result output are both off. -->
    <component name="accuracyTracker" type="edu.cmu.sphinx.instrumentation.BestPathAccuracyTracker">
        <property name="recognizer" value="${recognizer}"/>
        <property name="showRawResults" value="false"/>
        <property name="showAlignedResults" value="false"/>
    </component>
    
    <!-- Speed monitor attached to ${recognizer} and ${frontend}; timer output is on. -->
    <component name="speedTracker" type="edu.cmu.sphinx.instrumentation.SpeedTracker">
        <property name="recognizer" value="${recognizer}"/>
        <property name="frontend" value="${frontend}"/>
        <property name="showTimers" value="true"/>
    </component>
    
    <!-- Recognizer monitor that lists configMonitor under allocatedMonitors.
         The item name is written without trailing whitespace so that it matches
         the configMonitor component name exactly.
         This component is defined here but is not listed in the recognizer's
         "monitors" property list. -->
    <component name="recognizerMonitor"
        type="edu.cmu.sphinx.instrumentation.RecognizerMonitor">
        <property name="recognizer" value="${recognizer}"/>
        <propertylist name="allocatedMonitors">
            <item>configMonitor</item>
        </propertylist>
    </component>
    
    <!-- Memory monitor attached to ${recognizer}. -->
    <component name="memoryTracker" type="edu.cmu.sphinx.instrumentation.MemoryTracker">
        <property name="recognizer" value="${recognizer}"/>
    </component>
    
    <!-- Configuration monitor referenced by recognizerMonitor; showConfig is off. -->
    <component name="configMonitor" type="edu.cmu.sphinx.instrumentation.ConfigMonitor">
        <property name="showConfig" value="false"/>
    </component>
    
</config>

--- (Edited on 12/15/2012 12:38 pm [GMT-0600] by e.fields) ---

Re: Problems with Voxforge Acoustic Model
User: nsh
Date: 12/15/2012 2:58 pm
Views: 2699
Rating: 10

You already asked this question here:

http://www.voxforge.org/home/forums/other-languages-forums/spanish/language-model-for-voxforge-spanish-acoustic-model

--- (Edited on 12/15/2012 23:58 [GMT+0300] by nsh) ---

Previous | Next