Link Search Menu Expand Document

Data Quality Metric Explanations

preparation quality metrics

CluedIn calculates data quality metrics based off all data that is ingested into the platform. There are many times where you will want a verbose explanation on why a certain data quality score was given. For example, imagine if your had what you think is golden records, but CluedIn gave it very low quality scores - you would want to know exactly why.

The first option is to visualise this explanation within the user inteface by clicking on the “Explain” button when you see a data quality score widget.

The second example would be to get this data from our GraphQL endpoint.

Here is an example that will fetch a detailed explanation of the “Accuracy” metric for Global and Entity Level dimensions.

  metrics
  {
    name
    
    dimensions
    {
      id
      type
      ... on GlobalMetricDimension
      {
        children
        {
          id
        }
      }
      ... on MetricDimension
      {
        valueHistogram
      }
    }
    
    globalLevel: dimension(id : "25118d8c-696e-591f-9eb5-083bff9488d4")
    {
      id
      ... on GlobalMetricDimension
      {
        children
        {
          id
        }
      }
    }
    
    entityLevel: dimension(id: "b545b625-5a9b-5614-ae57-f2c61e02bdb9")
    {
      id
      ... on MetricDimension
      {
        valueHistogram
      }
    }
    
    globalDimension
    {
      id
      latestValue
      parentId
      
      children
      {
        id
        parentId
        type
        detailType
        detail
        providerDefinitionId
        providerId
        providerName
        
#        valueHistogram
        
        entityValues(
          sort: VALUE, 
          sortDirection: ASCENDING,
          cursor: "ewAiAFAAYQBnAGUAIgA6ADUALAAiAFAAYQBnAGUAUwBpAHoAZQAiADoAMgAwAH0A"
        )
        {
          entries
          {
            value
            dimension
            {
              detailType
              latestValue
              children
              {
                detailType
                detail
                latestValue
              }
            }
            entity
            {
              name
              entityType
            }
          }
          cursor
        }
       
        children
        {
        	id
        	parentId
        	type
        	detailType
        	detail
        	providerDefinitionId
        	providerId
        	providerName
          
          valueHistogram
          
          entityValues(sortDirection: ASCENDING)
          {
            entries
            {
              value
            }
            cursor
          }
        }
      }
    }
  }