pub enum Variable {
Show 634 variants
ClassifyNumCpLevels,
TextordDotmatrixGap,
TextordDebugBlock,
TextordPitchRange,
TextordWordsVetoPower,
TextordTabfindShowStrokewidths,
PitsyncLinearVersion,
PitsyncFakeDepth,
OldblHoledLosscount,
TextordSkewsmoothOffset,
TextordSkewsmoothOffset2,
TextordTestX,
TextordTestY,
TextordMinBlobsInRow,
TextordSplineMinblobs,
TextordSplineMedianwin,
TextordMaxBlobOverlaps,
TextordMinXheight,
TextordLmsLineTrials,
TextordTabfindShowImages,
TextordFpChopError,
EdgesMaxChildrenPerOutline,
EdgesMaxChildrenLayers,
EdgesChildrenPerGrandchild,
EdgesChildrenCountLimit,
EdgesMinNonhole,
EdgesPathareaRatio,
DevanagariSplitDebuglevel,
TextordTabfindShowPartitions,
TextordDebugTabfind,
TextordDebugBugs,
TextordTestregionLeft,
TextordTestregionTop,
TextordTestregionRight,
TextordTestregionBottom,
EditorImageXpos,
EditorImageYpos,
EditorImageMenuheight,
EditorImageWordBbColor,
EditorImageBlobBbColor,
EditorImageTextColor,
EditorDbwinXpos,
EditorDbwinYpos,
EditorDbwinHeight,
EditorDbwinWidth,
EditorWordXpos,
EditorWordYpos,
EditorWordHeight,
EditorWordWidth,
WordrecDisplaySplits,
PolyDebug,
PolyWideObjectsBetter,
WordrecDisplayAllBlobs,
WordrecBlobPause,
TextordFpChopping,
TextordForceMakePropWords,
TextordChopperTest,
TextordRestoreUnderlines,
TextordShowInitialWords,
TextordShowNewWords,
TextordShowFixedWords,
TextordBlocksallFixed,
TextordBlocksallProp,
TextordBlocksallTesting,
TextordTestMode,
TextordPitchScalebigwords,
TextordAllProp,
TextordDebugPitchTest,
TextordDisablePitchTest,
TextordFastPitchTest,
TextordDebugPitchMetric,
TextordShowRowCuts,
TextordShowPageCuts,
TextordPitchCheat,
TextordBlockndocFixed,
TextordShowTables,
TextordTablefindShowMark,
TextordTablefindShowStats,
TextordTablefindRecognizeTables,
TextordTabfindShowInitialtabs,
TextordTabfindShowFinaltabs,
TextordTabfindOnlyStrokewidths,
TextordReallyOldXheight,
TextordOldblDebug,
TextordDebugBaselines,
TextordOldblParadef,
TextordOldblSplitSplines,
TextordOldblMergeParts,
OldblCorrfix,
OldblXhfix,
TextordOcropusMode,
TextordHeavyNr,
TextordShowInitialRows,
TextordShowParallelRows,
TextordShowExpandedRows,
TextordShowFinalRows,
TextordShowFinalBlobs,
TextordTestLandscape,
TextordParallelBaselines,
TextordStraightBaselines,
TextordOldBaselines,
TextordOldXheight,
TextordFixXheightBug,
TextordFixMakerowBug,
TextordDebugXheights,
TextordBiasedSkewcalc,
TextordInterpolatingSkew,
TextordNewInitialXheight,
TextordDebugBlob,
GapmapDebug,
GapmapUseEnds,
GapmapNoIsolatedQuanta,
EdgesUseNewOutlineComplexity,
EdgesDebug,
EdgesChildrenFix,
TextordShowFixedCuts,
DevanagariSplitDebugimage,
TextordTabfindShowInitialPartitions,
TextordTabfindShowRejectBlobs,
TextordTabfindShowColumns,
TextordTabfindShowBlocks,
TextordTabfindFindTables,
TextordSpaceSizeIsVariable,
TextordDebugPrintable,
EquationdetectSaveBiImage,
EquationdetectSaveSptImage,
EquationdetectSaveSeedImage,
EquationdetectSaveMergedImage,
StreamFilelist,
DebugFile,
Dotproduct,
ClassifyFontName,
FxDebugfile,
EditorImageWinName,
EditorDbwinName,
EditorWordName,
DocumentTitle,
ClassifyPicoFeatureLength,
ClassifyNormAdjMidpoint,
ClassifyNormAdjCurl,
ClassifyMinSlope,
ClassifyMaxSlope,
ClassifyCpAnglePadLoose,
ClassifyCpAnglePadMedium,
ClassifyCpAnglePadTight,
ClassifyCpEndPadLoose,
ClassifyCpEndPadMedium,
ClassifyCpEndPadTight,
ClassifyCpSidePadLoose,
ClassifyCpSidePadMedium,
ClassifyCpSidePadTight,
ClassifyPpAnglePad,
ClassifyPpEndPad,
ClassifyPpSidePad,
TextordUnderlineOffset,
TextordWordstatsSmoothFactor,
TextordWidthSmoothFactor,
TextordWordsWidthIle,
TextordWordsMaxspace,
TextordWordsDefaultMaxspace,
TextordWordsDefaultMinspace,
TextordWordsMinMinspace,
TextordWordsDefaultNonspace,
TextordWordsInitialLower,
TextordWordsInitialUpper,
TextordWordsMinlarge,
TextordWordsPitchsdThreshold,
TextordWordsDefFixed,
TextordWordsDefProp,
TextordPitchRowsimilarity,
WordsInitialLower,
WordsInitialUpper,
WordsDefaultPropNonspace,
WordsDefaultFixedSpace,
WordsDefaultFixedLimit,
TextordWordsDefiniteSpread,
TextordSpacesizeRatiofp,
TextordSpacesizeRatioprop,
TextordFpiqrRatio,
TextordMaxPitchIqr,
TextordFpMinWidth,
TextordProjectionScale,
TextordBalanceFactor,
TextordTabvectorVerticalGapFraction,
TextordTabvectorVerticalBoxRatio,
PitsyncJoinedEdge,
PitsyncOffsetFreecutFraction,
OldblXhfract,
OldblDotErrorSize,
TextordOldblJumplimit,
TextordSplineShiftFraction,
TextordSplineOutlierFraction,
TextordSkewIle,
TextordSkewLag,
TextordLinespaceIqrlimit,
TextordWidthLimit,
TextordChopWidth,
TextordExpansionFactor,
TextordOverlapX,
TextordMinxh,
TextordMinLinesize,
TextordExcessBlobsize,
TextordOccupancyThreshold,
TextordUnderlineWidth,
TextordMinBlobHeightFraction,
TextordXheightModeFraction,
TextordAscheightModeFraction,
TextordDescheightModeFraction,
TextordAscxRatioMin,
TextordAscxRatioMax,
TextordDescxRatioMin,
TextordDescxRatioMax,
TextordXheightErrorMargin,
GapmapBigGaps,
TextordFpChopSnap,
EdgesChildarea,
EdgesBoxarea,
TextordUnderlineThreshold,
AmbigsDebugLevel,
ClassifyDebugLevel,
ClassifyNormMethod,
MatcherDebugLevel,
MatcherDebugFlags,
ClassifyLearningDebugLevel,
MatcherPermanentClassesMin,
MatcherMinExamplesForPrototyping,
MatcherSufficientExamplesForPrototyping,
ClassifyAdaptProtoThreshold,
ClassifyAdaptFeatureThreshold,
ClassifyClassPrunerThreshold,
ClassifyClassPrunerMultiplier,
ClassifyCpCutoffStrength,
ClassifyIntegerMatcherMultiplier,
DawgDebugLevel,
HyphenDebugLevel,
StopperSmallwordSize,
StopperDebugLevel,
TesseditTruncateWordchoiceLog,
MaxPermuterAttempts,
RepairUnchoppedBlobs,
ChopDebug,
ChopSplitLength,
ChopSameDistance,
ChopMinOutlinePoints,
ChopSeamPileSize,
ChopInsideAngle,
ChopMinOutlineArea,
ChopCenteredMaxwidth,
ChopXyWeight,
WordrecDebugLevel,
WordrecMaxJoinChunks,
SegsearchDebugLevel,
SegsearchMaxPainPoints,
SegsearchMaxFutileClassifications,
LanguageModelDebugLevel,
LanguageModelNgramOrder,
LanguageModelViterbiListMaxNumPrunable,
LanguageModelViterbiListMaxSize,
LanguageModelMinCompoundLength,
WordrecDisplaySegmentations,
TesseditPagesegMode,
TesseditOcrEngineMode,
PagesegDevanagariSplitStrategy,
OcrDevanagariSplitStrategy,
BidiDebug,
ApplyboxDebug,
ApplyboxPage,
TesseditBigramDebug,
DebugNoiseRemoval,
NoiseMaxperblob,
NoiseMaxperword,
DebugXHtLevel,
QualityMinInitialAlphasReqd,
TesseditTessAdaptionMode,
MultilangDebugLevel,
ParagraphDebugLevel,
TesseditPreserveMinWdLen,
CrunchRatingMax,
CrunchPotIndicators,
CrunchLeaveLcStrings,
CrunchLeaveUcStrings,
CrunchLongRepetitions,
CrunchDebug,
FixspNonNoiseLimit,
FixspDoneMode,
DebugFixSpaceLevel,
XHtAcceptanceTolerance,
XHtMinChange,
SuperscriptDebug,
JpgQuality,
UserDefinedDpi,
MinCharactersToTry,
SuspectLevel,
SuspectShortWords,
TesseditRejectMode,
TesseditImageBorder,
MinSaneXHtPixels,
TesseditPageNumber,
TesseditParallelize,
LstmChoiceMode,
TospDebugLevel,
TospEnoughSpaceSamplesForMedian,
TospRedoKernLimit,
TospFewSamples,
TospShortRow,
TospSanityMethod,
TextordMaxNoiseSize,
TextordBaselineDebug,
TextordNoiseSizefraction,
TextordNoiseTranslimit,
TextordNoiseSncount,
UseAmbigsForAdaption,
AllowBlobDivision,
PrioritizeDivision,
ClassifyEnableLearning,
TessCnMatching,
TessBnMatching,
ClassifyEnableAdaptiveMatcher,
ClassifyUsePreAdaptedTemplates,
ClassifySaveAdaptedTemplates,
ClassifyEnableAdaptiveDebugger,
ClassifyNonlinearNorm,
DisableCharacterFragments,
ClassifyDebugCharacterFragments,
MatcherDebugSeparateWindows,
ClassifyBlnNumericMode,
LoadSystemDawg,
LoadFreqDawg,
LoadUnambigDawg,
LoadPuncDawg,
LoadNumberDawg,
LoadBigramDawg,
UseOnlyFirstUft8Step,
StopperNoAcceptableChoices,
SegmentNonalphabeticScript,
SaveDocWords,
MergeFragmentsInMatrix,
WordrecEnableAssoc,
ForceWordAssoc,
ChopEnable,
ChopVerticalCreep,
ChopNewSeamPile,
AssumeFixedPitchCharSegment,
WordrecSkipNoTruthWords,
WordrecDebugBlamer,
WordrecRunBlamer,
SaveAltChoices,
LanguageModelNgramOn,
LanguageModelNgramUseOnlyFirstUft8Step,
LanguageModelNgramSpaceDelimitedLanguage,
LanguageModelUseSigmoidalCertainty,
TesseditResegmentFromBoxes,
TesseditResegmentFromLineBoxes,
TesseditTrainFromBoxes,
TesseditMakeBoxesFromBoxes,
TesseditTrainLineRecognizer,
TesseditDumpPagesegImages,
TesseditDoInvert,
TesseditAmbigsTraining,
TesseditAdaptionDebug,
ApplyboxLearnCharsAndCharFragsMode,
ApplyboxLearnNgramsMode,
TesseditDisplayOutwords,
TesseditDumpChoices,
TesseditTimingDebug,
TesseditFixFuzzySpaces,
TesseditUnrejAnyWd,
TesseditFixHyphens,
TesseditEnableDocDict,
TesseditDebugFonts,
TesseditDebugBlockRejection,
TesseditEnableBigramCorrection,
TesseditEnableDictCorrection,
EnableNoiseRemoval,
TesseditMinimalRejPass1,
TesseditTestAdaption,
TestPt,
ParagraphTextBased,
LstmUseMatrix,
TesseditGoodQualityUnrej,
TesseditUseRejectSpaces,
TesseditPreserveBlkRejPerfectWds,
TesseditPreserveRowRejPerfectWds,
TesseditDontBlkrejGoodWds,
TesseditDontRowrejGoodWds,
TesseditRowRejGoodDocs,
TesseditRejectBadQualWds,
TesseditDebugDocRejection,
TesseditDebugQualityMetrics,
BlandUnrej,
UnlvTildeCrunching,
HocrFontInfo,
HocrCharBoxes,
CrunchEarlyMergeTessFails,
CrunchEarlyConvertBadUnlvChs,
CrunchTerribleGarbage,
CrunchLeaveOkStrings,
CrunchAcceptOk,
CrunchLeaveAcceptStrings,
CrunchIncludeNumerals,
TesseditPreferJoinedPunct,
TesseditWriteBlockSeparators,
TesseditWriteRepCodes,
TesseditWriteUnlv,
TesseditCreateTxt,
TesseditCreateHocr,
TesseditCreateAlto,
TesseditCreateLstmbox,
TesseditCreateTsv,
TesseditCreateWordstrbox,
TesseditCreatePdf,
TextonlyPdf,
SuspectConstrain1Il,
TesseditMinimalRejection,
TesseditZeroRejection,
TesseditWordForWord,
TesseditZeroKelvinRejection,
TesseditRejectionDebug,
TesseditFlip0O,
RejTrustDocDawg,
Rej1IlUseDictWord,
Rej1IlTrustPermuterType,
RejUseTessAccepted,
RejUseTessBlanks,
RejUseGoodPerm,
RejUseSensibleWd,
RejAlphasInNumberPerm,
TesseditCreateBoxfile,
TesseditWriteImages,
InteractiveDisplayMode,
TesseditOverridePermuter,
TesseditUsePrimaryParamsModel,
TextordTabfindShowVlines,
TextordUseCjkFpModel,
PolyAllowDetailedFx,
TesseditInitConfigOnly,
TextordEquationDetect,
TextordTabfindVerticalText,
TextordTabfindForceVerticalText,
PreserveInterwordSpaces,
PagesegApplyMusicMask,
TextordSingleHeightMode,
TospOldToMethod,
TospOldToConstrainSpKn,
TospOnlyUsePropRows,
TospForceWordbreakOnPunct,
TospUsePreChopping,
TospOldToBugFix,
TospBlockUseCertSpaces,
TospRowUseCertSpaces,
TospNarrowBlobsNotCert,
TospRowUseCertSpaces1,
TospRecoveryIsolatedRowStats,
TospOnlySmallGapsForKern,
TospAllFlipsFuzzy,
TospFuzzyLimitAll,
TospStatsUseXhtGaps,
TospUseXhtGaps,
TospOnlyUseXhtGaps,
TospRule9TestPunct,
TospFlipFuzzKnToSp,
TospFlipFuzzSpToKn,
TospImproveThresh,
TextordNoRejects,
TextordShowBlobs,
TextordShowBoxes,
TextordNoiseRejwords,
TextordNoiseRejrows,
TextordNoiseDebug,
ClassifyLearnDebugStr,
UserWordsFile,
UserWordsSuffix,
UserPatternsFile,
UserPatternsSuffix,
OutputAmbigWordsFile,
WordToDebug,
TesseditCharBlacklist,
TesseditCharWhitelist,
TesseditCharUnblacklist,
TesseditWriteParamsToFile,
ApplyboxExposurePattern,
ChsLeadingPunct,
ChsTrailingPunct1,
ChsTrailingPunct2,
OutlinesOdd,
Outlines2,
NumericPunctuation,
UnrecognisedChar,
OkRepeatedChNonAlphanumWds,
ConflictSetIl1,
FileType,
TesseditLoadSublangs,
PageSeparator,
ClassifyCharNormRange,
ClassifyMaxRatingRatio,
ClassifyMaxCertaintyMargin,
MatcherGoodThreshold,
MatcherReliableAdaptiveResult,
MatcherPerfectThreshold,
MatcherBadMatchPad,
MatcherRatingMargin,
MatcherAvgNoiseSize,
MatcherClusteringMaxAngleDelta,
ClassifyMisfitJunkPenalty,
RatingScale,
CertaintyScale,
TesseditClassMissScale,
ClassifyAdaptedPruningFactor,
ClassifyAdaptedPruningThreshold,
ClassifyCharacterFragmentsGarbageCertaintyThreshold,
SpeckleLargeMaxSize,
SpeckleRatingPenalty,
XheightPenaltySubscripts,
XheightPenaltyInconsistent,
SegmentPenaltyDictFrequentWord,
SegmentPenaltyDictCaseOk,
SegmentPenaltyDictCaseBad,
SegmentPenaltyDictNonword,
SegmentPenaltyGarbage,
StopperNondictCertaintyBase,
StopperPhase2CertaintyRejectionOffset,
StopperCertaintyPerChar,
StopperAllowableCharacterBadness,
DocDictPendingThreshold,
DocDictCertaintyThreshold,
TesseditCertaintyThreshold,
ChopSplitDistKnob,
ChopOverlapKnob,
ChopCenterKnob,
ChopSharpnessKnob,
ChopWidthChangeKnob,
ChopOkSplit,
ChopGoodSplit,
SegsearchMaxCharWhRatio,
LanguageModelNgramSmallProb,
LanguageModelNgramNonmatchScore,
LanguageModelNgramScaleFactor,
LanguageModelNgramRatingFactor,
LanguageModelPenaltyNonFreqDictWord,
LanguageModelPenaltyNonDictWord,
LanguageModelPenaltyPunc,
LanguageModelPenaltyCase,
LanguageModelPenaltyScript,
LanguageModelPenaltyChartype,
LanguageModelPenaltyFont,
LanguageModelPenaltySpacing,
LanguageModelPenaltyIncrement,
NoiseCertBasechar,
NoiseCertDisjoint,
NoiseCertPunc,
NoiseCertFactor,
QualityRejPc,
QualityBlobPc,
QualityOutlinePc,
QualityCharPc,
TestPtX,
TestPtY,
TesseditRejectDocPercent,
TesseditRejectBlockPercent,
TesseditRejectRowPercent,
TesseditWholeWdRejRowPercent,
TesseditGoodDocStillRowrejWd,
QualityRowrejPc,
CrunchTerribleRating,
CrunchPoorGarbageCert,
CrunchPoorGarbageRate,
CrunchPotPoorRate,
CrunchPotPoorCert,
CrunchDelRating,
CrunchDelCert,
CrunchDelMinHt,
CrunchDelMaxHt,
CrunchDelMinWidth,
CrunchDelHighWord,
CrunchDelLowWord,
CrunchSmallOutlinesSize,
FixspSmallOutlinesSize,
SuperscriptWorseCertainty,
SuperscriptBetteredCertainty,
SuperscriptScaledownRatio,
SubscriptMaxYTop,
SuperscriptMinYBottom,
SuspectRatingPerCh,
SuspectAcceptRating,
TesseditLowerFlipHyphen,
TesseditUpperFlipHyphen,
RejWholeOfMostlyRejectWordFract,
MinOrientationMargin,
TextordTabfindVerticalTextRatio,
TextordTabfindAlignedGapFraction,
TospOldSpKnThFactor,
TospThresholdBias1,
TospThresholdBias2,
TospNarrowFraction,
TospNarrowAspectRatio,
TospWideFraction,
TospWideAspectRatio,
TospFuzzySpaceFactor,
TospFuzzySpaceFactor1,
TospFuzzySpaceFactor2,
TospGapFactor,
TospKernGapFactor1,
TospKernGapFactor2,
TospKernGapFactor3,
TospIgnoreBigGaps,
TospIgnoreVeryBigGaps,
TospRepSpace,
TospEnoughSmallGaps,
TospTableKnSpRatio,
TospTableXhtSpRatio,
TospTableFuzzyKnSpRatio,
TospFuzzyKnFraction,
TospFuzzySpFraction,
TospMinSaneKnSp,
TospInitGuessKnMult,
TospInitGuessXhtMult,
TospMaxSaneKnThresh,
TospFlipCaution,
TospLargeKerning,
TospDontFoolWithSmallKerns,
TospNearLhEdge,
TospSillyKnSpGap,
TospPassWideFuzzSpToContext,
TextordNoiseAreaRatio,
TextordInitialxIle,
TextordInitialascIle,
TextordNoiseSizelimit,
TextordNoiseNormratio,
TextordNoiseSyfract,
TextordNoiseSxfract,
TextordNoiseHfract,
TextordNoiseRowratio,
TextordBlshiftMaxshift,
TextordBlshiftXfraction,
}
Expand description
Enum representing different variable options accepted by Tesseract
Variants§
ClassifyNumCpLevels
Number of Class Pruner Levels
Example value: "3"
TextordDotmatrixGap
Max pixel gap for broken fixed pitch
Example value: "3"
TextordDebugBlock
Block to do debug on
Example value: "0"
TextordPitchRange
Max range test on pitch
Example value: "2"
TextordWordsVetoPower
Rows required to outvote a veto
Example value: "5"
TextordTabfindShowStrokewidths
Show stroke widths
Example value: "0"
PitsyncLinearVersion
Use new fast algorithm
Example value: "6"
PitsyncFakeDepth
Max advance fake generation
Example value: "1"
OldblHoledLosscount
Max lost before fallback line used
Example value: "10"
TextordSkewsmoothOffset
For smooth factor
Example value: "4"
TextordSkewsmoothOffset2
For smooth factor
Example value: "1"
TextordTestX
coord of test pt
Example value: "-2147483647"
TextordTestY
coord of test pt
Example value: "-2147483647"
TextordMinBlobsInRow
Min blobs before gradient counted
Example value: "4"
TextordSplineMinblobs
Min blobs in each spline segment
Example value: "8"
TextordSplineMedianwin
Size of window for spline segmentation
Example value: "6"
TextordMaxBlobOverlaps
Max number of blobs a big blob can overlap
Example value: "4"
TextordMinXheight
Min credible pixel xheight
Example value: "10"
TextordLmsLineTrials
Number of line fits to do
Example value: "12"
TextordTabfindShowImages
Show image blobs
Example value: "0"
TextordFpChopError
Max allowed bending of chop cells
Example value: "2"
EdgesMaxChildrenPerOutline
Max number of children inside a character outline
Example value: "10"
EdgesMaxChildrenLayers
Max layers of nested children inside a character outline
Example value: "5"
EdgesChildrenPerGrandchild
Importance ratio for chucking outlines
Example value: "10"
EdgesChildrenCountLimit
Max holes allowed in blob
Example value: "45"
EdgesMinNonhole
Min pixels for potential char in box
Example value: "12"
EdgesPathareaRatio
Max lensq/area for acceptable child outline
Example value: "40"
DevanagariSplitDebuglevel
Debug level for split shiro-rekha process.
Example value: "0"
TextordTabfindShowPartitions
Show partition bounds, waiting if >1
Example value: "0"
TextordDebugTabfind
Debug tab finding
Example value: "0"
TextordDebugBugs
Turn on output related to bugs in tab finding
Example value: "0"
TextordTestregionLeft
Left edge of debug reporting rectangle
Example value: "-1"
TextordTestregionTop
Top edge of debug reporting rectangle
Example value: "-1"
TextordTestregionRight
Right edge of debug rectangle
Example value: "2147483647"
TextordTestregionBottom
Bottom edge of debug rectangle
Example value: "2147483647"
EditorImageXpos
Editor image X Pos
Example value: "590"
EditorImageYpos
Editor image Y Pos
Example value: "10"
EditorImageMenuheight
Add to image height for menu bar
Example value: "50"
EditorImageWordBbColor
Word bounding box colour
Example value: "7"
EditorImageBlobBbColor
Blob bounding box colour
Example value: "4"
EditorImageTextColor
Correct text colour
Example value: "2"
EditorDbwinXpos
Editor debug window X Pos
Example value: "50"
EditorDbwinYpos
Editor debug window Y Pos
Example value: "500"
EditorDbwinHeight
Editor debug window height
Example value: "24"
EditorDbwinWidth
Editor debug window width
Example value: "80"
EditorWordXpos
Word window X Pos
Example value: "60"
EditorWordYpos
Word window Y Pos
Example value: "510"
EditorWordHeight
Word window height
Example value: "240"
EditorWordWidth
Word window width
Example value: "655"
WordrecDisplaySplits
Display splits
Example value: "0"
PolyDebug
Debug old poly
Example value: "0"
PolyWideObjectsBetter
More accurate approx on wide things
Example value: "1"
WordrecDisplayAllBlobs
Display Blobs
Example value: "0"
WordrecBlobPause
Blob pause
Example value: "0"
TextordFpChopping
Do fixed pitch chopping
Example value: "1"
TextordForceMakePropWords
Force proportional word segmentation on all rows
Example value: "0"
TextordChopperTest
Chopper is being tested.
Example value: "0"
TextordRestoreUnderlines
Chop underlines & put back
Example value: "1"
TextordShowInitialWords
Display separate words
Example value: "0"
TextordShowNewWords
Display separate words
Example value: "0"
TextordShowFixedWords
Display forced fixed pitch words
Example value: "0"
TextordBlocksallFixed
Moan about prop blocks
Example value: "0"
TextordBlocksallProp
Moan about fixed pitch blocks
Example value: "0"
TextordBlocksallTesting
Dump stats when moaning
Example value: "0"
TextordTestMode
Do current test
Example value: "0"
TextordPitchScalebigwords
Scale scores on big words
Example value: "0"
TextordAllProp
All doc is proportional text
Example value: "0"
TextordDebugPitchTest
Debug on fixed pitch test
Example value: "0"
TextordDisablePitchTest
Turn off dp fixed pitch algorithm
Example value: "0"
TextordFastPitchTest
Do even faster pitch algorithm
Example value: "0"
TextordDebugPitchMetric
Write full metric stuff
Example value: "0"
TextordShowRowCuts
Draw row-level cuts
Example value: "0"
TextordShowPageCuts
Draw page-level cuts
Example value: "0"
TextordPitchCheat
Use correct answer for fixed/prop
Example value: "0"
TextordBlockndocFixed
Attempt whole doc/block fixed pitch
Example value: "0"
TextordShowTables
Show table regions
Example value: "0"
TextordTablefindShowMark
Debug table marking steps in detail
Example value: "0"
TextordTablefindShowStats
Show page stats used in table finding
Example value: "0"
TextordTablefindRecognizeTables
Enables the table recognizer for table layout and filtering.
Example value: "0"
TextordTabfindShowInitialtabs
Show tab candidates
Example value: "0"
TextordTabfindShowFinaltabs
Show tab vectors
Example value: "0"
TextordTabfindOnlyStrokewidths
Only run stroke widths
Example value: "0"
TextordReallyOldXheight
Use original wiseowl xheight
Example value: "0"
TextordOldblDebug
Debug old baseline generation
Example value: "0"
TextordDebugBaselines
Debug baseline generation
Example value: "0"
TextordOldblParadef
Use para default mechanism
Example value: "1"
TextordOldblSplitSplines
Split stepped splines
Example value: "1"
TextordOldblMergeParts
Merge suspect partitions
Example value: "1"
OldblCorrfix
Improve correlation of heights
Example value: "1"
OldblXhfix
Fix bug in modes threshold for xheights
Example value: "0"
TextordOcropusMode
Make baselines for ocropus
Example value: "0"
TextordHeavyNr
Vigorously remove noise
Example value: "0"
TextordShowInitialRows
Display row accumulation
Example value: "0"
TextordShowParallelRows
Display page correlated rows
Example value: "0"
TextordShowExpandedRows
Display rows after expanding
Example value: "0"
TextordShowFinalRows
Display rows after final fitting
Example value: "0"
TextordShowFinalBlobs
Display blob bounds after pre-ass
Example value: "0"
TextordTestLandscape
Tests refer to land/port
Example value: "0"
TextordParallelBaselines
Force parallel baselines
Example value: "1"
TextordStraightBaselines
Force straight baselines
Example value: "0"
TextordOldBaselines
Use old baseline algorithm
Example value: "1"
TextordOldXheight
Use old xheight algorithm
Example value: "0"
TextordFixXheightBug
Use spline baseline
Example value: "1"
TextordFixMakerowBug
Prevent multiple baselines
Example value: "1"
TextordDebugXheights
Test xheight algorithms
Example value: "0"
TextordBiasedSkewcalc
Bias skew estimates with line length
Example value: "1"
TextordInterpolatingSkew
Interpolate across gaps
Example value: "1"
TextordNewInitialXheight
Use test xheight mechanism
Example value: "1"
TextordDebugBlob
Print test blob information
Example value: "0"
GapmapDebug
Say which blocks have tables
Example value: "0"
GapmapUseEnds
Use large space at start and end of rows
Example value: "0"
GapmapNoIsolatedQuanta
Ensure gaps not less than 2 quanta wide
Example value: "0"
EdgesUseNewOutlineComplexity
Use the new outline complexity module
Example value: "0"
EdgesDebug
Turn on debugging for this module
Example value: "0"
EdgesChildrenFix
Remove boxy parents of char-like children
Example value: "0"
TextordShowFixedCuts
Draw fixed pitch cell boundaries
Example value: "0"
DevanagariSplitDebugimage
Whether to create a debug image for split shiro-rekha process.
Example value: "0"
TextordTabfindShowInitialPartitions
Show partition bounds
Example value: "0"
TextordTabfindShowRejectBlobs
Show blobs rejected as noise
Example value: "0"
TextordTabfindShowColumns
Show column bounds
Example value: "0"
TextordTabfindShowBlocks
Show final block bounds
Example value: "0"
TextordTabfindFindTables
Run table detection
Example value: "1"
TextordSpaceSizeIsVariable
If true, word delimiter spaces are assumed to have variable width, even though characters have fixed pitch.
Example value: "0"
TextordDebugPrintable
Make debug windows printable
Example value: "0"
EquationdetectSaveBiImage
Save input bi image
Example value: "0"
EquationdetectSaveSptImage
Save special character image
Example value: "0"
EquationdetectSaveSeedImage
Save the seed image
Example value: "0"
EquationdetectSaveMergedImage
Save the merged image
Example value: "0"
StreamFilelist
Stream a filelist from stdin
Example value: "0"
DebugFile
File to send tprintf output to
Dotproduct
Function used for calculation of dot product
Example value: "generic"
ClassifyFontName
Default font name to be used in training
Example value: "UnknownFont"
FxDebugfile
Name of debugfile
Example value: "FXDebug"
EditorImageWinName
Editor image window name
Example value: "EditorImage"
EditorDbwinName
Editor debug window name
Example value: "EditorDBWin"
EditorWordName
BL normalized word window
Example value: "BlnWords"
DocumentTitle
Title of output document (used for hOCR and PDF output)
ClassifyPicoFeatureLength
Pico Feature Length
Example value: "0.05"
ClassifyNormAdjMidpoint
Norm adjust midpoint ...
Example value: "32"
ClassifyNormAdjCurl
Norm adjust curl ...
Example value: "2"
ClassifyMinSlope
Slope below which lines are called horizontal
Example value: "0.414214"
ClassifyMaxSlope
Slope above which lines are called vertical
Example value: "2.41421"
ClassifyCpAnglePadLoose
Class Pruner Angle Pad Loose
Example value: "45"
ClassifyCpAnglePadMedium
Class Pruner Angle Pad Medium
Example value: "20"
ClassifyCpAnglePadTight
Class Pruner Angle Pad Tight
Example value: "10"
ClassifyCpEndPadLoose
Class Pruner End Pad Loose
Example value: "0.5"
ClassifyCpEndPadMedium
Class Pruner End Pad Medium
Example value: "0.5"
ClassifyCpEndPadTight
Class Pruner End Pad Tight
Example value: "0.5"
ClassifyCpSidePadLoose
Class Pruner Side Pad Loose
Example value: "2.5"
ClassifyCpSidePadMedium
Class Pruner Side Pad Medium
Example value: "1.2"
ClassifyCpSidePadTight
Class Pruner Side Pad Tight
Example value: "0.6"
ClassifyPpAnglePad
Proto Pruner Angle Pad
Example value: "45"
ClassifyPpEndPad
Proto Pruner End Pad
Example value: "0.5"
ClassifyPpSidePad
Proto Pruner Side Pad
Example value: "2.5"
TextordUnderlineOffset
Fraction of x to ignore
Example value: "0.1"
TextordWordstatsSmoothFactor
Smoothing gap stats
Example value: "0.05"
TextordWidthSmoothFactor
Smoothing width stats
Example value: "0.1"
TextordWordsWidthIle
Ile of blob widths for space est
Example value: "0.4"
TextordWordsMaxspace
Multiple of xheight
Example value: "4"
TextordWordsDefaultMaxspace
Max believable third space
Example value: "3.5"
TextordWordsDefaultMinspace
Fraction of xheight
Example value: "0.6"
TextordWordsMinMinspace
Fraction of xheight
Example value: "0.3"
TextordWordsDefaultNonspace
Fraction of xheight
Example value: "0.2"
TextordWordsInitialLower
Max initial cluster size
Example value: "0.25"
TextordWordsInitialUpper
Min initial cluster spacing
Example value: "0.15"
TextordWordsMinlarge
Fraction of valid gaps needed
Example value: "0.75"
TextordWordsPitchsdThreshold
Pitch sync threshold
Example value: "0.04"
TextordWordsDefFixed
Threshold for definite fixed
Example value: "0.016"
TextordWordsDefProp
Threshold for definite prop
Example value: "0.09"
TextordPitchRowsimilarity
Fraction of xheight for sameness
Example value: "0.08"
WordsInitialLower
Max initial cluster size
Example value: "0.5"
WordsInitialUpper
Min initial cluster spacing
Example value: "0.15"
WordsDefaultPropNonspace
Fraction of xheight
Example value: "0.25"
WordsDefaultFixedSpace
Fraction of xheight
Example value: "0.75"
WordsDefaultFixedLimit
Allowed size variance
Example value: "0.6"
TextordWordsDefiniteSpread
Non-fuzzy spacing region
Example value: "0.3"
TextordSpacesizeRatiofp
Min ratio space/nonspace
Example value: "2.8"
TextordSpacesizeRatioprop
Min ratio space/nonspace
Example value: "2"
TextordFpiqrRatio
Pitch IQR/Gap IQR threshold
Example value: "1.5"
TextordMaxPitchIqr
Xh fraction noise in pitch
Example value: "0.2"
TextordFpMinWidth
Min width of decent blobs
Example value: "0.5"
TextordProjectionScale
Ding rate for mid-cuts
Example value: "0.2"
TextordBalanceFactor
Ding rate for unbalanced char cells
Example value: "1"
TextordTabvectorVerticalGapFraction
Max fraction of mean blob width allowed for vertical gaps in vertical text
Example value: "0.5"
TextordTabvectorVerticalBoxRatio
Fraction of box matches required to declare a line vertical
Example value: "0.5"
PitsyncJoinedEdge
Dist inside big blob for chopping
Example value: "0.75"
PitsyncOffsetFreecutFraction
Fraction of cut for free cuts
Example value: "0.25"
OldblXhfract
Fraction of est allowed in calc
Example value: "0.4"
OldblDotErrorSize
Max aspect ratio of a dot
Example value: "1.26"
TextordOldblJumplimit
X fraction for new partition
Example value: "0.15"
TextordSplineShiftFraction
Fraction of line spacing for quad
Example value: "0.02"
TextordSplineOutlierFraction
Fraction of line spacing for outlier
Example value: "0.1"
TextordSkewIle
Ile of gradients for page skew
Example value: "0.5"
TextordSkewLag
Lag for skew on row accumulation
Example value: "0.02"
TextordLinespaceIqrlimit
Max iqr/median for linespace
Example value: "0.2"
TextordWidthLimit
Max width of blobs to make rows
Example value: "8"
TextordChopWidth
Max width before chopping
Example value: "1.5"
TextordExpansionFactor
Factor to expand rows by in expand_rows
Example value: "1"
TextordOverlapX
Fraction of linespace for good overlap
Example value: "0.375"
TextordMinxh
Fraction of linesize for min xheight
Example value: "0.25"
TextordMinLinesize
* blob height for initial linesize
Example value: "1.25"
TextordExcessBlobsize
New row made if blob makes row this big
Example value: "1.3"
TextordOccupancyThreshold
Fraction of neighbourhood
Example value: "0.4"
TextordUnderlineWidth
Multiple of line_size for underline
Example value: "2"
TextordMinBlobHeightFraction
Min blob height/top to include blob top into xheight stats
Example value: "0.75"
TextordXheightModeFraction
Min pile height to make xheight
Example value: "0.4"
TextordAscheightModeFraction
Min pile height to make ascheight
Example value: "0.08"
TextordDescheightModeFraction
Min pile height to make descheight
Example value: "0.08"
TextordAscxRatioMin
Min cap/xheight
Example value: "1.25"
TextordAscxRatioMax
Max cap/xheight
Example value: "1.8"
TextordDescxRatioMin
Min desc/xheight
Example value: "0.25"
TextordDescxRatioMax
Max desc/xheight
Example value: "0.6"
TextordXheightErrorMargin
Accepted variation
Example value: "0.1"
GapmapBigGaps
xht multiplier
Example value: "1.75"
TextordFpChopSnap
Max distance of chop pt from vertex
Example value: "0.5"
EdgesChildarea
Min area fraction of child outline
Example value: "0.5"
EdgesBoxarea
Min area fraction of grandchild for box
Example value: "0.875"
TextordUnderlineThreshold
Fraction of width occupied
Example value: "0.5"
AmbigsDebugLevel
Debug level for unichar ambiguities
Example value: "0"
ClassifyDebugLevel
Classify debug level
Example value: "0"
ClassifyNormMethod
Normalization Method ...
Example value: "1"
MatcherDebugLevel
Matcher Debug Level
Example value: "0"
MatcherDebugFlags
Matcher Debug Flags
Example value: "0"
ClassifyLearningDebugLevel
Learning Debug Level:
Example value: "0"
MatcherPermanentClassesMin
Min # of permanent classes
Example value: "1"
MatcherMinExamplesForPrototyping
Reliable Config Threshold
Example value: "3"
MatcherSufficientExamplesForPrototyping
Enable adaption even if the ambiguities have not been seen
Example value: "5"
ClassifyAdaptProtoThreshold
Threshold for good protos during adaptive 0-255
Example value: "230"
ClassifyAdaptFeatureThreshold
Threshold for good features during adaptive 0-255
Example value: "230"
ClassifyClassPrunerThreshold
Class Pruner Threshold 0-255
Example value: "229"
ClassifyClassPrunerMultiplier
Class Pruner Multiplier 0-255:
Example value: "15"
ClassifyCpCutoffStrength
Class Pruner CutoffStrength:
Example value: "7"
ClassifyIntegerMatcherMultiplier
Integer Matcher Multiplier 0-255:
Example value: "10"
DawgDebugLevel
Set to 1 for general debug info, to 2 for more details, to 3 to see all the debug messages
Example value: "0"
HyphenDebugLevel
Debug level for hyphenated words.
Example value: "0"
StopperSmallwordSize
Size of dict word to be treated as non-dict word
Example value: "2"
StopperDebugLevel
Stopper debug level
Example value: "0"
TesseditTruncateWordchoiceLog
Max words to keep in list
Example value: "10"
MaxPermuterAttempts
Maximum number of different character choices to consider during permutation. This limit is especially useful when user patterns are specified, since overly generic patterns can result in dawg search exploring an overly large number of options.
Example value: "10000"
RepairUnchoppedBlobs
Fix blobs that aren’t chopped
Example value: "1"
ChopDebug
Chop debug
Example value: "0"
ChopSplitLength
Split Length
Example value: "10000"
ChopSameDistance
Same distance
Example value: "2"
ChopMinOutlinePoints
Min Number of Points on Outline
Example value: "6"
ChopSeamPileSize
Max number of seams in seam_pile
Example value: "150"
ChopInsideAngle
Min Inside Angle Bend
Example value: "-50"
ChopMinOutlineArea
Min Outline Area
Example value: "2000"
ChopCenteredMaxwidth
Width of (smaller) chopped blobs above which we don’t care that a chop is not near the center.
Example value: "90"
ChopXyWeight
X / Y length weight
Example value: "3"
WordrecDebugLevel
Debug level for wordrec
Example value: "0"
WordrecMaxJoinChunks
Max number of broken pieces to associate
Example value: "4"
SegsearchDebugLevel
SegSearch debug level
Example value: "0"
SegsearchMaxPainPoints
Maximum number of pain points stored in the queue
Example value: "2000"
SegsearchMaxFutileClassifications
Maximum number of pain point classifications per chunk that did not result in finding a better word choice.
Example value: "20"
LanguageModelDebugLevel
Language model debug level
Example value: "0"
LanguageModelNgramOrder
Maximum order of the character ngram model
Example value: "8"
LanguageModelViterbiListMaxNumPrunable
Maximum number of prunable (those for which PrunablePath() is true) entries in each viterbi list recorded in BLOB_CHOICEs
Example value: "10"
LanguageModelViterbiListMaxSize
Maximum size of viterbi lists recorded in BLOB_CHOICEs
Example value: "500"
LanguageModelMinCompoundLength
Minimum length of compound words
Example value: "3"
WordrecDisplaySegmentations
Display Segmentations
Example value: "0"
TesseditPagesegMode
Page seg mode: 0=osd only, 1=auto+osd, 2=auto_only, 3=auto, 4=column, 5=block_vert, 6=block, 7=line, 8=word, 9=word_circle, 10=char, 11=sparse_text, 12=sparse_text+osd, 13=raw_line (Values from PageSegMode enum in publictypes.h)
Example value: "6"
TesseditOcrEngineMode
Which OCR engine(s) to run (Tesseract, LSTM, both). Defaults to loading and running the most accurate available.
Example value: "1"
PagesegDevanagariSplitStrategy
Whether to use the top-line splitting process for Devanagari documents while performing page-segmentation.
Example value: "0"
OcrDevanagariSplitStrategy
Whether to use the top-line splitting process for Devanagari documents while performing ocr.
Example value: "0"
BidiDebug
Debug level for BiDi
Example value: "0"
ApplyboxDebug
Debug level
Example value: "1"
ApplyboxPage
Page number to apply boxes from
Example value: "0"
TesseditBigramDebug
Amount of debug output for bigram correction.
Example value: "0"
DebugNoiseRemoval
Debug reassignment of small outlines
Example value: "0"
NoiseMaxperblob
Max diacritics to apply to a blob
Example value: "8"
NoiseMaxperword
Max diacritics to apply to a word
Example value: "16"
DebugXHtLevel
Reestimate debug
Example value: "0"
QualityMinInitialAlphasReqd
alphas in a good word
Example value: "2"
TesseditTessAdaptionMode
Adaptation decision algorithm for tess
Example value: "39"
MultilangDebugLevel
Print multilang debug info.
Example value: "0"
ParagraphDebugLevel
Print paragraph debug info.
Example value: "0"
TesseditPreserveMinWdLen
Only preserve wds longer than this
Example value: "2"
CrunchRatingMax
For adj length in rating per ch
Example value: "10"
CrunchPotIndicators
How many potential indicators needed
Example value: "1"
CrunchLeaveLcStrings
Don’t crunch words with long lower case strings
Example value: "4"
CrunchLeaveUcStrings
Don’t crunch words with long upper case strings
Example value: "4"
CrunchLongRepetitions
Crunch words with long repetitions
Example value: "3"
CrunchDebug
As it says
Example value: "0"
FixspNonNoiseLimit
How many non-noise blobs on either side?
Example value: "1"
FixspDoneMode
What constitutes done for spacing
Example value: "1"
DebugFixSpaceLevel
Contextual fixspace debug
Example value: "0"
XHtAcceptanceTolerance
Max allowed deviation of blob top outside of font data
Example value: "8"
XHtMinChange
Min change in xht before actually trying it
Example value: "8"
SuperscriptDebug
Debug level for sub & superscript fixer
Example value: "0"
JpgQuality
Set JPEG quality level
Example value: "85"
UserDefinedDpi
Specify DPI for input image
Example value: "0"
MinCharactersToTry
Specify minimum characters to try during OSD
Example value: "50"
SuspectLevel
Suspect marker level
Example value: "99"
SuspectShortWords
Don’t suspect dict wds longer than this
Example value: "2"
TesseditRejectMode
Rejection algorithm
Example value: "0"
TesseditImageBorder
Rej blbs near image edge limit
Example value: "2"
MinSaneXHtPixels
Reject any x-ht lt or eq than this
Example value: "8"
TesseditPageNumber
-1 -> All pages, else specific page to process
Example value: "-1"
TesseditParallelize
Run in parallel where possible
Example value: "0"
LstmChoiceMode
Allows alternative symbol choices to be included in the hOCR output. Valid input values are 0, 1, 2 and 3. 0 is the default value. With 1, the alternative symbol choices per timestep are included. With 2, the alternative symbol choices are accumulated per character.
Example value: "0"
TospDebugLevel
Debug data
Example value: "0"
TospEnoughSpaceSamplesForMedian
or should we use mean
Example value: "3"
TospRedoKernLimit
No.samples reqd to reestimate for row
Example value: "10"
TospFewSamples
No.gaps reqd with 1 large gap to treat as a table
Example value: "40"
TospShortRow
No.gaps reqd with few cert spaces to use certs
Example value: "20"
TospSanityMethod
How to avoid being silly
Example value: "1"
TextordMaxNoiseSize
Pixel size of noise
Example value: "7"
TextordBaselineDebug
Baseline debug level
Example value: "0"
TextordNoiseSizefraction
Fraction of size for maxima
Example value: "10"
TextordNoiseTranslimit
Transitions for normal blob
Example value: "16"
TextordNoiseSncount
super norm blobs to save row
Example value: "1"
UseAmbigsForAdaption
Use ambigs for deciding whether to adapt to a character
Example value: "0"
AllowBlobDivision
Use divisible blobs chopping
Example value: "1"
PrioritizeDivision
Prioritize blob division over chopping
Example value: "0"
ClassifyEnableLearning
Enable adaptive classifier
Example value: "1"
TessCnMatching
Character Normalized Matching
Example value: "0"
TessBnMatching
Baseline Normalized Matching
Example value: "0"
ClassifyEnableAdaptiveMatcher
Enable adaptive classifier
Example value: "1"
ClassifyUsePreAdaptedTemplates
Use pre-adapted classifier templates
Example value: "0"
ClassifySaveAdaptedTemplates
Save adapted templates to a file
Example value: "0"
ClassifyEnableAdaptiveDebugger
Enable match debugger
Example value: "0"
ClassifyNonlinearNorm
Non-linear stroke-density normalization
Example value: "0"
DisableCharacterFragments
Do not include character fragments in the results of the classifier
Example value: "1"
ClassifyDebugCharacterFragments
Bring up graphical debugging windows for fragments training
Example value: "0"
MatcherDebugSeparateWindows
Use two different windows for debugging the matching: One for the protos and one for the features.
Example value: "0"
ClassifyBlnNumericMode
Assume the input is numbers [0-9].
Example value: "0"
LoadSystemDawg
Load system word dawg.
Example value: "1"
LoadFreqDawg
Load frequent word dawg.
Example value: "1"
LoadUnambigDawg
Load unambiguous word dawg.
Example value: "1"
LoadPuncDawg
Load dawg with punctuation patterns.
Example value: "1"
LoadNumberDawg
Load dawg with number patterns.
Example value: "1"
LoadBigramDawg
Load dawg with special word bigrams.
Example value: "1"
UseOnlyFirstUft8Step
Use only the first UTF8 step of the given string when computing log probabilities.
Example value: "0"
StopperNoAcceptableChoices
Make AcceptableChoice() always return false. Useful when there is a need to explore all segmentations
Example value: "0"
SegmentNonalphabeticScript
Don’t use any alphabetic-specific tricks. Set to true in the traineddata config file for scripts that are cursive or inherently fixed-pitch
Example value: "0"
SaveDocWords
Save Document Words
Example value: "0"
MergeFragmentsInMatrix
Merge the fragments in the ratings matrix and delete them after merging
Example value: "1"
WordrecEnableAssoc
Associator Enable
Example value: "1"
ForceWordAssoc
force associator to run regardless of what enable_assoc is. This is used for CJK where component grouping is necessary.
Example value: "0"
ChopEnable
Chop enable
Example value: "1"
ChopVerticalCreep
Vertical creep
Example value: "0"
ChopNewSeamPile
Use new seam_pile
Example value: "1"
AssumeFixedPitchCharSegment
include fixed-pitch heuristics in char segmentation
Example value: "0"
WordrecSkipNoTruthWords
Only run OCR for words that had truth recorded in BlamerBundle
Example value: "0"
WordrecDebugBlamer
Print blamer debug messages
Example value: "0"
WordrecRunBlamer
Try to set the blame for errors
Example value: "0"
SaveAltChoices
Save alternative paths found during chopping and segmentation search
Example value: "1"
LanguageModelNgramOn
Turn on/off the use of character ngram model
Example value: "0"
LanguageModelNgramUseOnlyFirstUft8Step
Use only the first UTF8 step of the given string when computing log probabilities.
Example value: "0"
LanguageModelNgramSpaceDelimitedLanguage
Words are delimited by space
Example value: "1"
LanguageModelUseSigmoidalCertainty
Use sigmoidal score for certainty
Example value: "0"
TesseditResegmentFromBoxes
Take segmentation and labeling from box file
Example value: "0"
TesseditResegmentFromLineBoxes
Conversion of word/line box file to char box file
Example value: "0"
TesseditTrainFromBoxes
Generate training data from boxed chars
Example value: "0"
TesseditMakeBoxesFromBoxes
Generate more boxes from boxed chars
Example value: "0"
TesseditTrainLineRecognizer
Break input into lines and remap boxes if present
Example value: "0"
TesseditDumpPagesegImages
Dump intermediate images made during page segmentation
Example value: "0"
TesseditDoInvert
Try inverting the image in `LSTMRecognizeWord`
Example value: "1"
TesseditAmbigsTraining
Perform training for ambiguities
Example value: "0"
TesseditAdaptionDebug
Generate and print debug information for adaption
Example value: "0"
ApplyboxLearnCharsAndCharFragsMode
Learn both character fragments (as is done in the special low exposure mode) as well as unfragmented characters.
Example value: "0"
ApplyboxLearnNgramsMode
Each bounding box is assumed to contain ngrams. Only learn the ngrams whose outlines overlap horizontally.
Example value: "0"
TesseditDisplayOutwords
Draw output words
Example value: "0"
TesseditDumpChoices
Dump char choices
Example value: "0"
TesseditTimingDebug
Print timing stats
Example value: "0"
TesseditFixFuzzySpaces
Try to improve fuzzy spaces
Example value: "1"
TesseditUnrejAnyWd
Don’t bother with word plausibility
Example value: "0"
TesseditFixHyphens
Crunch double hyphens?
Example value: "1"
TesseditEnableDocDict
Add words to the document dictionary
Example value: "1"
TesseditDebugFonts
Output font info per char
Example value: "0"
TesseditDebugBlockRejection
Block and Row stats
Example value: "0"
TesseditEnableBigramCorrection
Enable correction based on the word bigram dictionary.
Example value: "1"
TesseditEnableDictCorrection
Enable single word correction based on the dictionary.
Example value: "0"
EnableNoiseRemoval
Remove and conditionally reassign small outlines when they confuse layout analysis, determining diacritics vs noise
Example value: "1"
TesseditMinimalRejPass1
Do minimal rejection on pass 1 output
Example value: "0"
TesseditTestAdaption
Test adaption criteria
Example value: "0"
TestPt
Test for point
Example value: "0"
ParagraphTextBased
Run paragraph detection on the post-text-recognition (more accurate)
Example value: "1"
LstmUseMatrix
Use ratings matrix/beam search with lstm
Example value: "1"
TesseditGoodQualityUnrej
Reduce rejection on good docs
Example value: "1"
TesseditUseRejectSpaces
Reject spaces?
Example value: "1"
TesseditPreserveBlkRejPerfectWds
Only rej partially rejected words in block rejection
Example value: "1"
TesseditPreserveRowRejPerfectWds
Only rej partially rejected words in row rejection
Example value: "1"
TesseditDontBlkrejGoodWds
Use word segmentation quality metric
Example value: "0"
TesseditDontRowrejGoodWds
Use word segmentation quality metric
Example value: "0"
TesseditRowRejGoodDocs
Apply row rejection to good docs
Example value: "1"
TesseditRejectBadQualWds
Reject all bad quality wds
Example value: "1"
TesseditDebugDocRejection
Page stats
Example value: "0"
TesseditDebugQualityMetrics
Output data to debug file
Example value: "0"
BlandUnrej
unrej potential with no checks
Example value: "0"
UnlvTildeCrunching
Mark v.bad words for tilde crunch
Example value: "0"
HocrFontInfo
Add font info to hocr output
Example value: "0"
HocrCharBoxes
Add coordinates for each character to hocr output
Example value: "0"
CrunchEarlyMergeTessFails
Before word crunch?
Example value: "1"
CrunchEarlyConvertBadUnlvChs
Take out ~^ early?
Example value: "0"
CrunchTerribleGarbage
As it says
Example value: "1"
CrunchLeaveOkStrings
Don’t touch sensible strings
Example value: "1"
CrunchAcceptOk
Use acceptability in okstring
Example value: "1"
CrunchLeaveAcceptStrings
Don’t pot crunch sensible strings
Example value: "0"
CrunchIncludeNumerals
Fiddle alpha figures
Example value: "0"
TesseditPreferJoinedPunct
Reward punctuation joins
Example value: "0"
TesseditWriteBlockSeparators
Write block separators in output
Example value: "0"
TesseditWriteRepCodes
Write repetition char code
Example value: "0"
TesseditWriteUnlv
Write .unlv output file
Example value: "0"
TesseditCreateTxt
Write .txt output file
Example value: "0"
TesseditCreateHocr
Write .html hOCR output file
Example value: "0"
TesseditCreateAlto
Write .xml ALTO file
Example value: "0"
TesseditCreateLstmbox
Write .box file for LSTM training
Example value: "0"
TesseditCreateTsv
Write .tsv output file
Example value: "0"
TesseditCreateWordstrbox
Write WordStr format .box output file
Example value: "0"
TesseditCreatePdf
Write .pdf output file
Example value: "0"
TextonlyPdf
Create PDF with only one invisible text layer
Example value: "0"
SuspectConstrain1Il
UNLV keep 1Il chars rejected
Example value: "0"
TesseditMinimalRejection
Only reject tess failures
Example value: "0"
TesseditZeroRejection
Don’t reject ANYTHING
Example value: "0"
TesseditWordForWord
Make output have exactly one word per WERD
Example value: "0"
TesseditZeroKelvinRejection
Don’t reject ANYTHING AT ALL
Example value: "0"
TesseditRejectionDebug
Adaption debug
Example value: "0"
TesseditFlip0O
Contextual 0O O0 flips
Example value: "1"
RejTrustDocDawg
Use DOC dawg in 11l conf. detector
Example value: "0"
Rej1IlUseDictWord
Use dictword test
Example value: "0"
Rej1IlTrustPermuterType
Don’t double check
Example value: "1"
RejUseTessAccepted
Individual rejection control
Example value: "1"
RejUseTessBlanks
Individual rejection control
Example value: "1"
RejUseGoodPerm
Individual rejection control
Example value: "1"
RejUseSensibleWd
Extend permuter check
Example value: "0"
RejAlphasInNumberPerm
Extend permuter check
Example value: "0"
TesseditCreateBoxfile
Output text with boxes
Example value: "0"
TesseditWriteImages
Capture the image from the IPE
Example value: "0"
InteractiveDisplayMode
Run interactively?
Example value: "0"
TesseditOverridePermuter
According to dict_word
Example value: "1"
TesseditUsePrimaryParamsModel
In multilingual mode use params model of the primary language
Example value: "0"
TextordTabfindShowVlines
Debug line finding
Example value: "0"
TextordUseCjkFpModel
Use CJK fixed pitch model
Example value: "0"
PolyAllowDetailedFx
Allow feature extractors to see the original outline
Example value: "0"
TesseditInitConfigOnly
Only initialize with the config file. Useful if the instance is not going to be used for OCR but say only for layout analysis.
Example value: "0"
TextordEquationDetect
Turn on equation detector
Example value: "0"
TextordTabfindVerticalText
Enable vertical detection
Example value: "1"
TextordTabfindForceVerticalText
Force using vertical text page mode
Example value: "0"
PreserveInterwordSpaces
Preserve multiple interword spaces
Example value: "0"
PagesegApplyMusicMask
Detect music staff and remove intersecting components
Example value: "1"
TextordSingleHeightMode
Script has no xheight, so use a single mode
Example value: "0"
TospOldToMethod
Space stats use prechopping?
Example value: "0"
TospOldToConstrainSpKn
Constrain relative values of inter and intra-word gaps for old_to_method.
Example value: "0"
TospOnlyUsePropRows
Block stats to use fixed pitch rows?
Example value: "1"
TospForceWordbreakOnPunct
Force word breaks on punct to break long lines in non-space delimited langs
Example value: "0"
TospUsePreChopping
Space stats use prechopping?
Example value: "0"
TospOldToBugFix
Fix suspected bug in old code
Example value: "0"
TospBlockUseCertSpaces
Only stat OBVIOUS spaces
Example value: "1"
TospRowUseCertSpaces
Only stat OBVIOUS spaces
Example value: "1"
TospNarrowBlobsNotCert
Only stat OBVIOUS spaces
Example value: "1"
TospRowUseCertSpaces1
Only stat OBVIOUS spaces
Example value: "1"
TospRecoveryIsolatedRowStats
Use row alone when inadequate cert spaces
Example value: "1"
TospOnlySmallGapsForKern
Better guess
Example value: "0"
TospAllFlipsFuzzy
Pass ANY flip to context?
Example value: "0"
TospFuzzyLimitAll
Don’t restrict kn->sp fuzzy limit to tables
Example value: "1"
TospStatsUseXhtGaps
Use within xht gap for wd breaks
Example value: "1"
TospUseXhtGaps
Use within xht gap for wd breaks
Example value: "1"
TospOnlyUseXhtGaps
Only use within xht gap for wd breaks
Example value: "0"
TospRule9TestPunct
Don’t chng kn to space next to punct
Example value: "0"
TospFlipFuzzKnToSp
Default flip
Example value: "1"
TospFlipFuzzSpToKn
Default flip
Example value: "1"
TospImproveThresh
Enable improvement heuristic
Example value: "0"
TextordNoRejects
Don’t remove noise blobs
Example value: "0"
TextordShowBlobs
Display unsorted blobs
Example value: "0"
TextordShowBoxes
Display unsorted blobs
Example value: "0"
TextordNoiseRejwords
Reject noise-like words
Example value: "1"
TextordNoiseRejrows
Reject noise-like rows
Example value: "1"
TextordNoiseDebug
Debug row garbage detector
Example value: "0"
ClassifyLearnDebugStr
Class str to debug learning
UserWordsFile
A filename of user-provided words.
UserWordsSuffix
A suffix of user-provided words located in tessdata.
UserPatternsFile
A filename of user-provided patterns.
UserPatternsSuffix
A suffix of user-provided patterns located in tessdata.
OutputAmbigWordsFile
Output file for ambiguities found in the dictionary
WordToDebug
Word for which stopper debug information should be printed to stdout
TesseditCharBlacklist
Blacklist of chars not to recognize
TesseditCharWhitelist
Whitelist of chars to recognize
TesseditCharUnblacklist
List of chars to override tessedit_char_blacklist
TesseditWriteParamsToFile
Write all parameters to the given file.
ApplyboxExposurePattern
Exposure value follows this pattern in the image filename. The name of the image files are expected to be in the form [lang].[fontname].exp[num].tif
Example value: ".exp"
ChsLeadingPunct
Leading punctuation
Example value: "(\'`\""
ChsTrailingPunct1
1st Trailing punctuation
Example value: ").,;:?!"
ChsTrailingPunct2
2nd Trailing punctuation
Example value: ")\'`\""
OutlinesOdd
Non standard number of outlines
Example value: "%| "
Outlines2
Non standard number of outlines
Example value: "ij!?%\":;"
NumericPunctuation
Punct. chs expected WITHIN numbers
Example value: ".,"
UnrecognisedChar
Output char for unidentified blobs
Example value: "|"
OkRepeatedChNonAlphanumWds
Allow NN to unrej
Example value: "-?*="
ConflictSetIl1
Il1 conflict set
Example value: "Il1[]"
FileType
Filename extension
Example value: ".tif"
TesseditLoadSublangs
List of languages to load with this one
PageSeparator
Page separator (default is form feed control character)
Example value: "\u{c}"
ClassifyCharNormRange
Character Normalization Range ...
Example value: "0.2"
ClassifyMaxRatingRatio
Veto ratio between classifier ratings
Example value: "1.5"
ClassifyMaxCertaintyMargin
Veto difference between classifier certainties
Example value: "5.5"
MatcherGoodThreshold
Good Match (0-1)
Example value: "0.125"
MatcherReliableAdaptiveResult
Great Match (0-1)
Example value: "0"
MatcherPerfectThreshold
Perfect Match (0-1)
Example value: "0.02"
MatcherBadMatchPad
Bad Match Pad (0-1)
Example value: "0.15"
MatcherRatingMargin
New template margin (0-1)
Example value: "0.1"
MatcherAvgNoiseSize
Avg. noise blob length
Example value: "12"
MatcherClusteringMaxAngleDelta
Maximum angle delta for prototype clustering
Example value: "0.015"
ClassifyMisfitJunkPenalty
Penalty to apply when a non-alnum is vertically out of its expected textline position
Example value: "0"
RatingScale
Rating scaling factor
Example value: "1.5"
CertaintyScale
Certainty scaling factor
Example value: "20"
TesseditClassMissScale
Scale factor for features not used
Example value: "0.00390625"
ClassifyAdaptedPruningFactor
Prune poor adapted results this much worse than best result
Example value: "2.5"
ClassifyAdaptedPruningThreshold
Threshold at which classify_adapted_pruning_factor starts
Example value: "-1"
ClassifyCharacterFragmentsGarbageCertaintyThreshold
Exclude fragments that do not look like whole characters from training and adaption
Example value: "-3"
SpeckleLargeMaxSize
Max large speckle size
Example value: "0.3"
SpeckleRatingPenalty
Penalty to add to worst rating for noise
Example value: "10"
XheightPenaltySubscripts
Score penalty (0.1 = 10%) added if there are subscripts or superscripts in a word, but it is otherwise OK.
Example value: "0.125"
XheightPenaltyInconsistent
Score penalty (0.1 = 10%) added if an xheight is inconsistent.
Example value: "0.25"
SegmentPenaltyDictFrequentWord
Score multiplier for word matches which have good case and are frequent in the given language (lower is better).
Example value: "1"
SegmentPenaltyDictCaseOk
Score multiplier for word matches that have good case (lower is better).
Example value: "1.1"
SegmentPenaltyDictCaseBad
Default score multiplier for word matches, which may have case issues (lower is better).
Example value: "1.3125"
SegmentPenaltyDictNonword
Score multiplier for glyph fragment segmentations which do not match a dictionary word (lower is better).
Example value: "1.25"
SegmentPenaltyGarbage
Score multiplier for poorly cased strings that are not in the dictionary and generally look like garbage (lower is better).
Example value: "1.5"
StopperNondictCertaintyBase
Certainty threshold for non-dict words
Example value: "-2.5"
StopperPhase2CertaintyRejectionOffset
Reject certainty offset
Example value: "1"
StopperCertaintyPerChar
Certainty to add for each dict char above small word size.
Example value: "-0.5"
StopperAllowableCharacterBadness
Max certainty variation allowed in a word (in sigma)
Example value: "3"
DocDictPendingThreshold
Worst certainty for using pending dictionary
Example value: "0"
DocDictCertaintyThreshold
Worst certainty for words that can be inserted into the document dictionary
Example value: "-2.25"
TesseditCertaintyThreshold
Good blob limit
Example value: "-2.25"
ChopSplitDistKnob
Split length adjustment
Example value: "0.5"
ChopOverlapKnob
Split overlap adjustment
Example value: "0.9"
ChopCenterKnob
Split center adjustment
Example value: "0.15"
ChopSharpnessKnob
Split sharpness adjustment
Example value: "0.06"
ChopWidthChangeKnob
Width change adjustment
Example value: "5"
ChopOkSplit
OK split limit
Example value: "100"
ChopGoodSplit
Good split limit
Example value: "50"
SegsearchMaxCharWhRatio
Maximum character width-to-height ratio
Example value: "2"
LanguageModelNgramSmallProb
To avoid overly small denominators use this as the floor of the probability returned by the ngram model.
Example value: "1e-06"
LanguageModelNgramNonmatchScore
Average classifier score of a non-matching unichar.
Example value: "-40"
LanguageModelNgramScaleFactor
Strength of the character ngram model relative to the character classifier
Example value: "0.03"
LanguageModelNgramRatingFactor
Factor to bring log-probs into the same range as ratings when multiplied by outline length
Example value: "16"
LanguageModelPenaltyNonFreqDictWord
Penalty for words not in the frequent word dictionary
Example value: "0.1"
LanguageModelPenaltyNonDictWord
Penalty for non-dictionary words
Example value: "0.15"
LanguageModelPenaltyPunc
Penalty for inconsistent punctuation
Example value: "0.2"
LanguageModelPenaltyCase
Penalty for inconsistent case
Example value: "0.1"
LanguageModelPenaltyScript
Penalty for inconsistent script
Example value: "0.5"
LanguageModelPenaltyChartype
Penalty for inconsistent character type
Example value: "0.3"
LanguageModelPenaltyFont
Penalty for inconsistent font
Example value: "0"
LanguageModelPenaltySpacing
Penalty for inconsistent spacing
Example value: "0.05"
LanguageModelPenaltyIncrement
Penalty increment
Example value: "0.01"
NoiseCertBasechar
Hingepoint for base char certainty
Example value: "-8"
NoiseCertDisjoint
Hingepoint for disjoint certainty
Example value: "-1"
NoiseCertPunc
Threshold for new punc char certainty
Example value: "-3"
NoiseCertFactor
Scaling on certainty diff from Hingepoint
Example value: "0.375"
QualityRejPc
good_quality_doc lte rejection limit
Example value: "0.08"
QualityBlobPc
good_quality_doc gte good blobs limit
Example value: "0"
QualityOutlinePc
good_quality_doc lte outline error limit
Example value: "1"
QualityCharPc
good_quality_doc gte good char limit
Example value: "0.95"
TestPtX
xcoord
Example value: "100000"
TestPtY
ycoord
Example value: "100000"
TesseditRejectDocPercent
%rej allowed before rej whole doc
Example value: "65"
TesseditRejectBlockPercent
%rej allowed before rej whole block
Example value: "45"
TesseditRejectRowPercent
%rej allowed before rej whole row
Example value: "40"
TesseditWholeWdRejRowPercent
Number of row rejects in whole word rejects which prevents whole row rejection
Example value: "70"
TesseditGoodDocStillRowrejWd
rej good doc wd if more than this fraction rejected
Example value: "1.1"
QualityRowrejPc
good_quality_doc gte good char limit
Example value: "1.1"
CrunchTerribleRating
crunch rating lt this
Example value: "80"
CrunchPoorGarbageCert
crunch garbage cert lt this
Example value: "-9"
CrunchPoorGarbageRate
crunch garbage rating lt this
Example value: "60"
CrunchPotPoorRate
POTENTIAL crunch rating lt this
Example value: "40"
CrunchPotPoorCert
POTENTIAL crunch cert lt this
Example value: "-8"
CrunchDelRating
POTENTIAL crunch rating lt this
Example value: "60"
CrunchDelCert
POTENTIAL crunch cert lt this
Example value: "-10"
CrunchDelMinHt
Del if word ht lt xht x this
Example value: "0.7"
CrunchDelMaxHt
Del if word ht gt xht x this
Example value: "3"
CrunchDelMinWidth
Del if word width lt xht x this
Example value: "3"
CrunchDelHighWord
Del if word gt xht x this above bl
Example value: "1.5"
CrunchDelLowWord
Del if word gt xht x this below bl
Example value: "0.5"
CrunchSmallOutlinesSize
Small if lt xht x this
Example value: "0.6"
FixspSmallOutlinesSize
Small if lt xht x this
Example value: "0.28"
SuperscriptWorseCertainty
How many times worse certainty does a superscript position glyph need to be for us to try classifying it as a char with a different baseline?
Example value: "2"
SuperscriptBetteredCertainty
What reduction in badness do we think sufficient to choose a superscript over what we’d thought. For example, a value of 0.6 means we want to reduce badness of certainty by at least 40%
Example value: "0.97"
SuperscriptScaledownRatio
A superscript scaled down more than this is unbelievably small. For example, 0.3 means we expect the font size to be no smaller than 30% of the text line font size.
Example value: "0.4"
SubscriptMaxYTop
Maximum top of a character measured as a multiple of x-height above the baseline for us to reconsider whether it’s a subscript.
Example value: "0.5"
SuperscriptMinYBottom
Minimum bottom of a character measured as a multiple of x-height above the baseline for us to reconsider whether it’s a superscript.
Example value: "0.3"
SuspectRatingPerCh
Don’t touch bad rating limit
Example value: "999.9"
SuspectAcceptRating
Accept good rating limit
Example value: "-999.9"
TesseditLowerFlipHyphen
Aspect ratio dot/hyphen test
Example value: "1.5"
TesseditUpperFlipHyphen
Aspect ratio dot/hyphen test
Example value: "1.8"
RejWholeOfMostlyRejectWordFract
if >this fract
Example value: "0.85"
MinOrientationMargin
Min acceptable orientation margin
Example value: "7"
TextordTabfindVerticalTextRatio
Fraction of textlines deemed vertical to use vertical page mode
Example value: "0.5"
TextordTabfindAlignedGapFraction
Fraction of height used as a minimum gap for aligned blobs.
Example value: "0.75"
TospOldSpKnThFactor
Factor for defining space threshold in terms of space and kern sizes
Example value: "2"
TospThresholdBias1
how far between kern and space?
Example value: "0"
TospThresholdBias2
how far between kern and space?
Example value: "0"
TospNarrowFraction
Fract of xheight for narrow
Example value: "0.3"
TospNarrowAspectRatio
narrow if w/h less than this
Example value: "0.48"
TospWideFraction
Fract of xheight for wide
Example value: "0.52"
TospWideAspectRatio
wide if w/h less than this
Example value: "0"
TospFuzzySpaceFactor
Fract of xheight for fuzz sp
Example value: "0.6"
TospFuzzySpaceFactor1
Fract of xheight for fuzz sp
Example value: "0.5"
TospFuzzySpaceFactor2
Fract of xheight for fuzz sp
Example value: "0.72"
TospGapFactor
gap ratio to flip sp->kern
Example value: "0.83"
TospKernGapFactor1
gap ratio to flip kern->sp
Example value: "2"
TospKernGapFactor2
gap ratio to flip kern->sp
Example value: "1.3"
TospKernGapFactor3
gap ratio to flip kern->sp
Example value: "2.5"
TospIgnoreBigGaps
xht multiplier
Example value: "-1"
TospIgnoreVeryBigGaps
xht multiplier
Example value: "3.5"
TospRepSpace
rep gap multiplier for space
Example value: "1.6"
TospEnoughSmallGaps
Fract of kerns reqd for isolated row stats
Example value: "0.65"
TospTableKnSpRatio
Min difference of kn & sp in table
Example value: "2.25"
TospTableXhtSpRatio
Expect spaces bigger than this
Example value: "0.33"
TospTableFuzzyKnSpRatio
Fuzzy if less than this
Example value: "3"
TospFuzzyKnFraction
New fuzzy kn alg
Example value: "0.5"
TospFuzzySpFraction
New fuzzy sp alg
Example value: "0.5"
TospMinSaneKnSp
Don’t trust spaces less than this times kn
Example value: "1.5"
TospInitGuessKnMult
Thresh guess - mult kn by this
Example value: "2.2"
TospInitGuessXhtMult
Thresh guess - mult xht by this
Example value: "0.28"
TospMaxSaneKnThresh
Multiplier on kn to limit thresh
Example value: "5"
TospFlipCaution
Don’t autoflip kn to sp when large separation
Example value: "0"
TospLargeKerning
Limit use of xht gap with large kns
Example value: "0.19"
TospDontFoolWithSmallKerns
Limit use of xht gap with odd small kns
Example value: "-1"
TospNearLhEdge
Don’t reduce box if the top left is non blank
Example value: "0"
TospSillyKnSpGap
Don’t let sp minus kn get too small
Example value: "0.2"
TospPassWideFuzzSpToContext
How wide fuzzies need context
Example value: "0.75"
TextordNoiseAreaRatio
Fraction of bounding box for noise
Example value: "0.7"
TextordInitialxIle
Ile of sizes for xheight guess
Example value: "0.75"
TextordInitialascIle
Ile of sizes for xheight guess
Example value: "0.9"
TextordNoiseSizelimit
Fraction of x for big t count
Example value: "0.5"
TextordNoiseNormratio
Dot to norm ratio for deletion
Example value: "2"
TextordNoiseSyfract
xh fract height error for norm blobs
Example value: "0.2"
TextordNoiseSxfract
xh fract width error for norm blobs
Example value: "0.4"
TextordNoiseHfract
Height fraction to discard outlines as speckle noise
Example value: "0.015625"
TextordNoiseRowratio
Dot to norm ratio for deletion
Example value: "6"
TextordBlshiftMaxshift
Max baseline shift
Example value: "0"
TextordBlshiftXfraction
Min size of baseline shift
Example value: "9.99"