mHUB - Example Configurations

Here's an example of a simple configuration for mHUB:

<?xml version="1.0" encoding="UTF-8"?>
<!-- Simple mHUB configuration: Matching mode, individual level enabled, matching groups output. -->
<settings>
  <!-- Mode mHUB is configured for. -->
  <mode>Matching</mode>

  <!-- Input layout: column names, each introduced by a '|' character. -->
  <data>
    <input columns="|UniqueRef|FullName|Address1|Address2|Address3|Postcode" />
  </data>

  <matching>
    <!-- Two match keys; each key joins its components with '+'. -->
    <keys>
      <key>PostOut + NameKey</key>
      <key>PhoneticLastName + AddressKey</key>
    </keys>

    <!-- Only the individual level has enabled="true". The other levels leave
         enabled empty (presumably treated as not enabled; confirm against the
         product documentation). -->
    <levels>
      <individual  minimumScore="80" enabled="true" />
      <nameOnly    minimumScore="40" enabled="" />
      <family      minimumScore="80" enabled="" />
      <address     minimumScore="55" enabled="" />
      <business    minimumScore="80" enabled="" />
      <companyOnly minimumScore="40" enabled="" />
      <custom      minimumScore="80" enabled="" />
    </levels>

    <outputs>
      <!-- Output types: matchingGroups is the only one with enabled="true". -->
      <types>
        <matchingPairs        enabled="" />
        <groupedMatchingPairs enabled="" />
        <matchingGroups       enabled="true" />
        <dedupedData          enabled="" />
        <duplicateData        enabled="" />
      </types>
      <options>
        <outputUniqueRefsOnly enabled="true" />
      </options>
    </outputs>
  </matching>

  <advanced>
    <nationality>USA</nationality>
  </advanced>
</settings>

After applying this configuration, mHUB will be configured for Matching at the individual level, using two match keys for high data volumes, and will output matching groups of records.

The following chapters detail the contents of the configuration settings.

The example omits the memory settings, the disk settings, and some miscellaneous settings; for these, please refer to the samples\configFull.xml file, which is available after the product has been installed.

Default values will be used for any settings that are not specified in the configuration.

 

Here is a more complete configuration example, showing how the settings are arranged:

<?xml version="1.0" encoding="UTF-8"?>
<!-- Fuller mHUB configuration: adds output options, matching-level advanced
     settings, threads, memory, disk and matching-rule weights. -->
<settings>
  <!-- Mode mHUB is configured for. -->
  <mode>Matching</mode>

  <!-- Input layout: column names, each introduced by a '|' character. -->
  <data>
    <input columns="|UniqueRef|FullName|Address1|Address2|Address3|Postcode" />
  </data>

  <matching>
    <!-- Three match keys; each key joins its components with '+'. -->
    <keys>
      <key>AddressKey+Name1</key>
      <key>Name1+PostOut+Premise</key>
      <key>PhoneticTown+PhoneticStreet+Premise</key>
    </keys>

    <!-- Only the individual level has enabled="true". The other levels leave
         enabled empty (presumably treated as not enabled; confirm against the
         product documentation). -->
    <levels>
      <individual  minimumScore="80" enabled="true" />
      <nameOnly    minimumScore="40" enabled="" />
      <family      minimumScore="80" enabled="" />
      <address     minimumScore="55" enabled="" />
      <business    minimumScore="80" enabled="" />
      <companyOnly minimumScore="40" enabled="" />
      <custom      minimumScore="80" enabled="" />
    </levels>

    <outputs>
      <!-- Output types: matchingGroups is the only one with enabled="true". -->
      <types>
        <matchingPairs        enabled="" />
        <groupedMatchingPairs enabled="" />
        <matchingGroups       enabled="true" />
        <dedupedData          enabled="" />
        <duplicateData        enabled="" />
      </types>
      <!-- Every output option is explicitly switched off in this example. -->
      <options>
        <outputUniqueRefsOnly   enabled="false" />
        <outputComponentScores  enabled="false" />
        <outputExactMatchScores enabled="false" />
        <outputAllExactMatches  enabled="false" />
        <!-- NOTE(review): records="false" looks unusual for an attribute named
             "records"; confirm the expected value type. -->
        <outputLargeClusters enabled="false" records="false" />
      </options>
    </outputs>

    <!-- Advanced settings scoped to matching (distinct from the top-level
         <advanced> element further down). -->
    <advanced>
      <postMatchingRules>
        <rule condition="level(IndividualLevel) and NameScore = 0" action="delete" />
      </postMatchingRules>
      <bridgingPrevention>
        <nameBridgingPrevention    enabled="true" />
        <prefixBridgingPrevention  enabled="true" />
        <companyBridgingPrevention enabled="true" />
        <aggressiveSplitting       enabled="false" />
      </bridgingPrevention>
      <options>
        <outputDeletedMatches enabled="false" />
        <outputSubRecords     enabled="false" />
      </options>
      <volume>High</volume>
    </advanced>

    <maximumClusterSize>200</maximumClusterSize>
    <allowBlankKeys>true</allowBlankKeys>
    <dynamicKeys>false</dynamicKeys>
  </matching>

  <threads>0</threads>

  <!-- Memory settings: sizes are expressed as a value plus a units attribute. -->
  <memory>
    <inputBufferSize  value="1"  units="MB" />
    <outputBufferSize value="4"  units="MB" />
    <blockSize        value="16" units="KB" />
    <cacheLimit       value="0"  units="GB" />
    <threshold        value="0"  units="GB" />
    <compression level="1" />
    <encryption enabled="false" keySize="128" />
  </memory>

  <!-- Disk settings: location, size limit, compression and encryption. -->
  <disk>
    <location>C:\WINDOWS\TEMP</location>
    <limit value="1" units="TB" />
    <compression level="0" />
    <encryption enabled="true" keySize="256" />
  </disk>

  <!-- Top-level advanced settings: nationality and matching-rule weights. -->
  <advanced>
    <nationality>USA</nationality>
    <matchingRules>
      <individualLevel>
        <!-- One row per component, with a weight for each of the
             sure / likely / possible / oneEmpty / bothEmpty attributes.
             NOTE(review): bothEmpty="24" on <name> stands out against the
             values used on the other rows; confirm it is intended. -->
        <weights>
          <name         sure="60" likely="40" possible="25" oneEmpty="5" bothEmpty="24" />
          <organization sure="0"  likely="0"  possible="0"  oneEmpty="0" bothEmpty="0" />
          <address      sure="40" likely="30" possible="20" oneEmpty="5" bothEmpty="5" />
          <postcode     sure="30" likely="20" possible="15" oneEmpty="5" bothEmpty="5" />
        </weights>
      </individualLevel>
    </matchingRules>
  </advanced>
</settings>