public class CalculatorFacade extends Object implements Serializable
Modifier and Type | Field and Description |
---|---|
protected PathCache<? extends XmlFieldInstance> |
cache |
protected List<Calculator> |
calculators
The list of registered calculator objects.
|
protected boolean |
checkSkippableCollections |
protected boolean |
collectTfIdfTerms
Flag whether or not to collect TF-IDF terms in the uniqueness measurement
(default: false).
|
protected CompletenessCalculator |
completenessCalculator
The completeness calculator.
|
protected boolean |
completenessCollectFields
Flag whether or not run missing/empty/existing field collection in
completeness (default: false).
|
protected boolean |
completenessMeasurementEnabled
Flag whether or not run the completeness measurement
(default: true).
|
protected CompressionLevel |
compressionLevel |
protected CsvReader |
csvReader |
protected boolean |
fieldCardinalityMeasurementEnabled
Flag whether or not run the field cardinality measurement
(default: true).
|
protected boolean |
fieldExistenceMeasurementEnabled
Flag whether or not run the field existence measurement
(default: true).
|
protected FieldExtractor |
fieldExtractor
The field extractor object.
|
protected boolean |
fieldExtractorEnabled
Flag whether or not the field extractor is enabled (default: false).
|
protected Format |
format |
protected LanguageCalculator |
languageCalculator
The language detector.
|
protected boolean |
languageMeasurementEnabled
Flag whether or not run the language detector
(default: false).
|
protected MultilingualitySaturationCalculator |
multilingualSaturationCalculator
The multilingual saturation calculator.
|
protected boolean |
multilingualSaturationMeasurementEnabled
Flag whether or not run the multilingual saturation measurement
(default: false).
|
protected boolean |
problemCatalogMeasurementEnabled
Flag whether or not run the problem catalog
(default: false).
|
protected boolean |
ruleCatalogMeasurementEnabled
Flag whether or not run the rule catalog
(default: false).
|
protected boolean |
saturationExtendedResult |
protected Schema |
schema |
protected SolrClient |
solrClient |
protected SolrConfiguration |
solrConfiguration |
protected TfIdfCalculator |
tfidfCalculator
The TF-IDF calculator.
|
protected boolean |
tfIdfMeasurementEnabled
Flag whether or not to run the TF-IDF measurement
(default: false).
|
protected boolean |
uniquenessMeasurementEnabled |
Constructor and Description |
---|
CalculatorFacade()
Create calculator facade with the default configuration.
|
CalculatorFacade(boolean runFieldExistence,
boolean runFieldCardinality,
boolean runCompleteness,
boolean runTfIdf,
boolean runProblemCatalog)
Create calculator facade with configuration.
|
Modifier and Type | Method and Description |
---|---|
boolean |
collectTfIdfTerms()
Returns the flag whether the measurement should collect each individual
term with its Term Frequency and Inverse Document Frequency scores.
|
CalculatorFacade |
collectTfIdfTerms(boolean collectTfIdfTerms)
Sets the flag whether the measurement should collect each individual
term with its Term Frequency and Inverse Document Frequency scores.
|
boolean |
completenessCollectFields()
Get the completenessCollectFields flag.
|
CalculatorFacade |
completenessCollectFields(boolean completenessCollectFields)
The completeness calculation will collect empty, existent and missing fields.
|
protected void |
conditionalConfiguration() |
void |
configure()
Run the configuration based on the previously set flags.
|
CalculatorFacade |
configureSolr(String solrHost,
String solrPort,
String solrPath) |
CalculatorFacade |
disableCompletenessMeasurement() |
CalculatorFacade |
disableFieldCardinalityMeasurement() |
CalculatorFacade |
disableFieldExistenceMeasurement() |
CalculatorFacade |
disableFieldExtractor() |
CalculatorFacade |
disableLanguageMeasurement() |
CalculatorFacade |
disableMultilingualSaturationMeasurement() |
CalculatorFacade |
disableProblemCatalogMeasurement() |
CalculatorFacade |
disableRuleCatalogMeasurement() |
CalculatorFacade |
disableTfIdfMeasurement() |
CalculatorFacade |
disableUniquenessMeasurement() |
CalculatorFacade |
enableCompletenessMeasurement() |
CalculatorFacade |
enableCompletenessMeasurement(boolean runCompleteness)
Sets the flag whether or not run the completeness measurement.
|
CalculatorFacade |
enableFieldCardinalityMeasurement() |
CalculatorFacade |
enableFieldCardinalityMeasurement(boolean runFieldCardinality)
Configures whether or not to run the field cardinality measurement.
|
CalculatorFacade |
enableFieldExistenceMeasurement() |
CalculatorFacade |
enableFieldExistenceMeasurement(boolean runFieldExistence)
Sets whether or not to run the field existence measurement.
|
CalculatorFacade |
enableFieldExtractor() |
CalculatorFacade |
enableFieldExtractor(boolean flag) |
CalculatorFacade |
enableLanguageMeasurement() |
CalculatorFacade |
enableLanguageMeasurement(boolean runLanguage)
Configure whether or not run the language detector.
|
CalculatorFacade |
enableMultilingualSaturationMeasurement() |
CalculatorFacade |
enableMultilingualSaturationMeasurement(boolean runMultilingualSaturation)
Configure whether or not to run the multilingual saturation measurement.
|
CalculatorFacade |
enableProblemCatalogMeasurement() |
CalculatorFacade |
enableProblemCatalogMeasurement(boolean runProblemCatalog)
Configure to run the problem catalog measurement.
|
CalculatorFacade |
enableRuleCatalogMeasurement() |
CalculatorFacade |
enableRuleCatalogMeasurement(boolean run)
Configure to run the rule catalog measurement.
|
CalculatorFacade |
enableTfIdfMeasurement() |
CalculatorFacade |
enableTfIdfMeasurement(boolean runTfIdf)
Configure whether or not to run the TF-IDF measurement.
|
CalculatorFacade |
enableUniquenessMeasurement() |
CalculatorFacade |
enableUniquenessMeasurement(boolean uniquenessMeasurementEnabled)
Flag to enable uniqueness measurement.
|
PathCache<? extends XmlFieldInstance> |
getCache() |
List<Calculator> |
getCalculators()
Return the list of all registered calculators.
|
CompressionLevel |
getCompressionLevel() |
String |
getCsv(boolean withLabels,
CompressionLevel compressionLevel) |
List<String> |
getEmptyFields()
Returns the list of empty fields.
|
List<String> |
getExistingFields()
Returns the list of existing fields.
|
List<String> |
getHeader() |
Map<String,Map<String,? extends Object>> |
getLabelledResults() |
List<String> |
getMissingFields()
Returns the list of missing fields.
|
Map<String,Object> |
getResults()
Returns the result map.
|
Schema |
getSchema() |
Map<String,List<TfIdf>> |
getTermsCollection()
Returns the TF-IDF term map.
|
boolean |
isCheckSkippableCollections() |
boolean |
isCompletenessMeasurementEnabled()
Returns the flag whether or not run the completeness measurement.
|
boolean |
isFieldCardinalityMeasurementEnabled()
Returns whether or not to run cardinality measurement.
|
boolean |
isFieldExistenceMeasurementEnabled()
Returns whether or not to run the field existence measurement.
|
boolean |
isFieldExtractorEnabled() |
boolean |
isLanguageMeasurementEnabled()
Returns the flag whether or not run the language detector.
|
boolean |
isMultilingualSaturationMeasurementEnabled()
Returns the flag whether or not to run the multilingual saturation measurement.
|
boolean |
isProblemCatalogMeasurementEnabled()
Gets flag whether to run the problem catalog measurement.
|
boolean |
isRuleCatalogMeasurementEnabled()
Gets flag whether to run the rule catalog measurement.
|
boolean |
isSaturationExtendedResult() |
boolean |
isTfIdfMeasurementEnabled()
Returns whether or not to run the TF-IDF measurement.
|
boolean |
isUniquenessMeasurementEnabled()
Is uniqueness measurement enabled?
|
String |
measure(String jsonRecord)
Run the measurements with each Calculator then returns the result as CSV.
|
List<String> |
measureAsList(String jsonRecord) |
Map<String,Object> |
measureAsMap(String jsonRecord) |
protected <T extends XmlFieldInstance> |
measureWithGenerics(String content)
The generic version of measure.
|
protected <T extends XmlFieldInstance> |
measureWithGenerics(String content,
Class outputClass) |
CalculatorFacade |
setCheckSkippableCollections(boolean checkSkippableCollections) |
CalculatorFacade |
setCompressionLevel(CompressionLevel compressionLevel) |
CalculatorFacade |
setCsvReader(CsvReader csvReader) |
CalculatorFacade |
setSaturationExtendedResult(boolean saturationExtendedResult) |
CalculatorFacade |
setSchema(Schema schema) |
CalculatorFacade |
setSolrClient(SolrClient solrClient) |
protected boolean fieldExtractorEnabled
protected boolean fieldExistenceMeasurementEnabled
protected boolean fieldCardinalityMeasurementEnabled
protected boolean completenessMeasurementEnabled
protected boolean tfIdfMeasurementEnabled
protected boolean problemCatalogMeasurementEnabled
protected boolean ruleCatalogMeasurementEnabled
protected boolean languageMeasurementEnabled
protected boolean multilingualSaturationMeasurementEnabled
protected boolean collectTfIdfTerms
protected boolean completenessCollectFields
protected boolean saturationExtendedResult
protected boolean checkSkippableCollections
protected boolean uniquenessMeasurementEnabled
protected CompressionLevel compressionLevel
protected SolrClient solrClient
protected SolrConfiguration solrConfiguration
protected List<Calculator> calculators
protected FieldExtractor fieldExtractor
protected CompletenessCalculator completenessCalculator
protected TfIdfCalculator tfidfCalculator
protected LanguageCalculator languageCalculator
protected MultilingualitySaturationCalculator multilingualSaturationCalculator
protected Format format
protected PathCache<? extends XmlFieldInstance> cache
protected Schema schema
protected CsvReader csvReader
public CalculatorFacade()
public CalculatorFacade(boolean runFieldExistence, boolean runFieldCardinality, boolean runCompleteness, boolean runTfIdf, boolean runProblemCatalog)
runFieldExistence
- Flag whether or not to run the field existence measurement
runFieldCardinality
- Flag whether or not to run the field cardinality measurement
runCompleteness
- Flag whether or not to run the completeness measurement
runTfIdf
- Flag whether or not to run the uniqueness measurement
runProblemCatalog
- Flag whether or not to run the problem catalog
protected void conditionalConfiguration()
public void configure()
public String measure(String jsonRecord) throws com.jayway.jsonpath.InvalidJsonException
jsonRecord
- The JSON record string
com.jayway.jsonpath.InvalidJsonException
- Invalid JSON exception
public List<String> measureAsList(String jsonRecord) throws com.jayway.jsonpath.InvalidJsonException
com.jayway.jsonpath.InvalidJsonException
public Map<String,Object> measureAsMap(String jsonRecord) throws com.jayway.jsonpath.InvalidJsonException
com.jayway.jsonpath.InvalidJsonException
protected <T extends XmlFieldInstance> Object measureWithGenerics(String content) throws com.jayway.jsonpath.InvalidJsonException
T
- A class defining the internal representation of a field. It should be
an extension of XmlFieldInstance
content
- The JSON record
com.jayway.jsonpath.InvalidJsonException
protected <T extends XmlFieldInstance> Object measureWithGenerics(String content, Class outputClass) throws com.jayway.jsonpath.InvalidJsonException
com.jayway.jsonpath.InvalidJsonException
public CalculatorFacade enableFieldExtractor()
public CalculatorFacade disableFieldExtractor()
public CalculatorFacade enableFieldExtractor(boolean flag)
public boolean isFieldExtractorEnabled()
public boolean isFieldExistenceMeasurementEnabled()
public CalculatorFacade enableFieldExistenceMeasurement()
public CalculatorFacade disableFieldExistenceMeasurement()
public CalculatorFacade enableFieldExistenceMeasurement(boolean runFieldExistence)
runFieldExistence
- field existence measurement flag
public boolean isFieldCardinalityMeasurementEnabled()
public CalculatorFacade enableFieldCardinalityMeasurement()
public CalculatorFacade disableFieldCardinalityMeasurement()
public CalculatorFacade enableFieldCardinalityMeasurement(boolean runFieldCardinality)
runFieldCardinality
- cardinality measurement flag
public boolean isCompletenessMeasurementEnabled()
public CalculatorFacade enableCompletenessMeasurement()
public CalculatorFacade disableCompletenessMeasurement()
public CalculatorFacade enableCompletenessMeasurement(boolean runCompleteness)
runCompleteness
- flag whether or not to run the completeness measurement
public boolean isLanguageMeasurementEnabled()
public CalculatorFacade enableLanguageMeasurement()
public CalculatorFacade disableLanguageMeasurement()
public CalculatorFacade enableLanguageMeasurement(boolean runLanguage)
runLanguage
- flag whether or not to run the language detector
public boolean isMultilingualSaturationMeasurementEnabled()
public CalculatorFacade enableMultilingualSaturationMeasurement()
public CalculatorFacade disableMultilingualSaturationMeasurement()
public CalculatorFacade enableMultilingualSaturationMeasurement(boolean runMultilingualSaturation)
runMultilingualSaturation
- flag whether or not to run the multilingual saturation measurement
public boolean isTfIdfMeasurementEnabled()
public CalculatorFacade enableTfIdfMeasurement()
public CalculatorFacade disableTfIdfMeasurement()
public CalculatorFacade enableTfIdfMeasurement(boolean runTfIdf)
runTfIdf
- uniqueness measurement flag
public boolean isProblemCatalogMeasurementEnabled()
public CalculatorFacade enableProblemCatalogMeasurement()
public CalculatorFacade disableProblemCatalogMeasurement()
public CalculatorFacade enableProblemCatalogMeasurement(boolean runProblemCatalog)
runProblemCatalog
- problem catalog measurement flag
public boolean isRuleCatalogMeasurementEnabled()
public CalculatorFacade enableRuleCatalogMeasurement()
public CalculatorFacade disableRuleCatalogMeasurement()
public CalculatorFacade enableRuleCatalogMeasurement(boolean run)
run
- rule catalog measurement flag
public boolean isUniquenessMeasurementEnabled()
public CalculatorFacade enableUniquenessMeasurement()
public CalculatorFacade disableUniquenessMeasurement()
public CalculatorFacade enableUniquenessMeasurement(boolean uniquenessMeasurementEnabled)
uniquenessMeasurementEnabled
- The flag
public List<Calculator> getCalculators()
public boolean collectTfIdfTerms()
public CalculatorFacade collectTfIdfTerms(boolean collectTfIdfTerms)
collectTfIdfTerms
- The TF-IDF collector flag
public boolean completenessCollectFields()
public CalculatorFacade completenessCollectFields(boolean completenessCollectFields)
completenessCollectFields
- The completenessCollectFields flag
public List<String> getExistingFields()
public List<String> getEmptyFields()
public List<String> getMissingFields()
public Map<String,List<TfIdf>> getTermsCollection()
TfIdfCalculator.getTermsCollection()
public Map<String,Object> getResults()
Counters.getResults()
public String getCsv(boolean withLabels, CompressionLevel compressionLevel)
public CalculatorFacade configureSolr(String solrHost, String solrPort, String solrPath)
public boolean isSaturationExtendedResult()
public CalculatorFacade setSaturationExtendedResult(boolean saturationExtendedResult)
public CompressionLevel getCompressionLevel()
public CalculatorFacade setCompressionLevel(CompressionLevel compressionLevel)
public PathCache<? extends XmlFieldInstance> getCache()
public boolean isCheckSkippableCollections()
public CalculatorFacade setCheckSkippableCollections(boolean checkSkippableCollections)
public Schema getSchema()
public CalculatorFacade setSchema(Schema schema)
public CalculatorFacade setSolrClient(SolrClient solrClient)
public CalculatorFacade setCsvReader(CsvReader csvReader)
Copyright © 2020. All rights reserved.