All Downloads are FREE. Search and download functionalities are using the official Maven repository.

json.schema.metadataIngestion.databaseServiceAutoClassificationPipeline.json Maven / Gradle / Ivy

There is a newer version: 1.6.0-rc1
Show newest version
{
  "$id": "https://open-metadata.org/schema/metadataIngestion/databaseServiceAutoClassificationPipeline.json",
  "$schema": "http://json-schema.org/draft-07/schema#",
  "title": "DatabaseServiceAutoClassificationPipeline",
  "description": "DatabaseService AutoClassification & Auto Classification Pipeline Configuration.",
  "type": "object",
  "definitions": {
    "autoClassificationConfigType": {
      "description": "Profiler Source Config Pipeline type",
      "type": "string",
      "enum": ["AutoClassification"],
      "default": "AutoClassification"
    }
  },
  "properties": {
    "type": {
      "description": "Pipeline type",
      "$ref": "#/definitions/autoClassificationConfigType",
      "default": "AutoClassification"
    },
    "classificationFilterPattern": {
      "description": "Regex to only compute metrics for table that matches the given tag, tiers, gloassary pattern.",
      "$ref": "../type/filterPattern.json#/definitions/filterPattern",
      "title": "Classification Filter Pattern"
    },
    "schemaFilterPattern": {
      "description": "Regex to only fetch tables or databases that matches the pattern.",
      "$ref": "../type/filterPattern.json#/definitions/filterPattern",
      "title": "Schema Filter Pattern"
    },
    "tableFilterPattern": {
      "description": "Regex exclude tables or databases that matches the pattern.",
      "$ref": "../type/filterPattern.json#/definitions/filterPattern",
      "title": "Table Filter Pattern"
    },
    "databaseFilterPattern": {
      "description": "Regex to only fetch databases that matches the pattern.",
      "$ref": "../type/filterPattern.json#/definitions/filterPattern",
      "title": "Database Filter Pattern"
    },
    "includeViews": {
      "description": "Optional configuration to turn off fetching metadata for views.",
      "type": "boolean",
      "default": true,
      "title": "Include Views"
    },
    "useFqnForFiltering": {
      "description": "Regex will be applied on fully qualified name (e.g service_name.db_name.schema_name.table_name) instead of raw name (e.g. table_name)",
      "type": "boolean",
      "default": false,
      "title": "Use FQN For Filtering"
    },
    "storeSampleData": {
      "description": "Option to turn on/off storing sample data. If enabled, we will ingest sample data for each table.",
      "type": "boolean",
      "default": true,
      "title": "Store Sample Data"
    },
    "enableAutoClassification": {
      "description": "Optional configuration to automatically tag columns that might contain sensitive information",
      "type": "boolean",
      "default": false,
      "title": "Enable Auto Classification"
    },
    "confidence": {
      "description": "Set the Confidence value for which you want the column to be tagged as PII. Confidence value ranges from 0 to 100. A higher number will yield less false positives but more false negatives. A lower number will yield more false positives but less false negatives.",
      "type": "number",
      "default": 80,
      "title": "Auto Classification Inference Confidence Level"
    },
    "sampleDataCount": {
      "description": "Number of sample rows to ingest when 'Generate Sample Data' is enabled",
      "type": "integer",
      "default": 50,
      "title": "Sample Data Rows Count"
    }
  },
  "additionalProperties": false
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy