reference.plugins.json Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of fta Show documentation
Show all versions of fta Show documentation
Analyze text data to determine simple type and semantic type information, as well as other key metrics associated with a text stream.
[
{
"semanticType": "EMAIL",
"description": "Email Address",
"pluginType": "java",
"signature": "+A0AMjgeFlGRlPKsX/iXYmoWpfY=",
"clazz": "com.cobber.fta.plugins.EmailLT",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(email|e-mail|e_mail).*", "confidence": 90 } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(correo|email|e-mail|e_mail).*", "confidence": 90 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P968" },
{ "source": "wikipedia", "reference": "https://https://en.wikipedia.org/wiki/Email_address" },
{ "source": "schema", "reference": "https://schema.org/email" }
],
"priority": 10
},
{
"semanticType": "URI.URL",
"description": "URL - see RFC 3986",
"pluginType": "java",
"signature": "r+muJMmeRDtmg9qyVbWCOAMusc8=",
"clazz": "com.cobber.fta.plugins.URLLT",
"validLocales": [ { "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(url|web).*", "confidence": 90 } ] } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P2699" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Uniform_Resource_Identifier" },
{ "source": "schema", "reference": "https://schema.org/url" }
],
"priority": 15
},
{
"semanticType": "IPADDRESS.IPV4",
"description": "IP V4 Address",
"pluginType": "java",
"signature": "tjKmv3C98nzoxPHtvYb1sp+UQEY=",
"clazz": "com.cobber.fta.plugins.IPV4Address",
"validLocales": [ { "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(ip).*", "confidence": 70 } ] } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P511" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Internet_Protocol_version_4" }
],
"threshold": 99,
"priority": 20
},
{
"semanticType": "IPADDRESS.IPV6",
"description": "IP V6 Address",
"pluginType": "java",
"signature": "UCm9KlNKo0Hv4BULLB3qSWbMQHY=",
"clazz": "com.cobber.fta.plugins.IPV6Address",
"validLocales": [ { "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(ip).*", "confidence": 70 } ] } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P511" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/IPv6" }
],
"threshold": 99,
"priority": 25
},
{
"semanticType": "TELEPHONE",
"description": "Telephone Number (Generic)",
"pluginType": "java",
"signature": "YOwAVZnoqmDtMa0wUtlF+Mda69U=",
"clazz": "com.cobber.fta.plugins.PhoneNumberLT",
"validLocales": [ { "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(?u)(phone|fax|mobile|cell|contact.?number|mobiel|móvil|movil|telephone|telefono|telefon|telefoon|téléphone|телефон|Факс|τηλέφωνο|電話).*", "confidence": 98 } ] } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P1329" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Telephone_number" },
{ "source": "schema", "reference": "https://schema.org/telephone" }
],
"baseType": "STRING",
"priority": 40
},
{
"semanticType": "GUID",
"description": "Globally Unique Identifier, e.g. 30DD879E-FE2F-11DB-8314-9800310C9A67",
"pluginType": "java",
"signature": "AtovlR1okrAJUeTCpYUUTXow4yM=",
"clazz": "com.cobber.fta.plugins.GUID",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(guid).*", "confidence": 99 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Q254972" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Universally_unique_identifier" }
],
"threshold": 99,
"priority": 50
},
{
"semanticType": "VIN",
"description": "Vehicle Identification Number",
"pluginType": "java",
"signature": "JLD6IQMMMoQZTZH7OyHsGRuSoTQ=",
"clazz": "com.cobber.fta.plugins.VIN",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P6322" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Vehicle_identification_number" }
],
"threshold": 98,
"priority": 51
},
{
"semanticType": "POSTAL_CODE.ZIP5_US",
"description": "Postal Code (US)",
"pluginType": "java",
"signature": "/o1vxOzeSy+OB/GwjvwcCCv6ri0=",
"clazz": "com.cobber.fta.plugins.address.USZip5",
"validLocales": [
{ "localeTag": "en-US,en-Latn-US,en-CA,fr-CA",
"headerRegExps": [ { "regExp": ".*(?i)(zip|postal|postcode).*", "confidence": 95 }, { "regExp": "(?i).*fips.*", "confidence": -100 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ZIP_Code" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"baseType": "STRING",
"threshold": 90,
"priority": 60
},
{
"semanticType": "POSTAL_CODE.ZIP5_PLUS4_US",
"description": "Postal Code + 4 (US)",
"pluginType": "java",
"signature": "97eQHR8swSv5+VyCVyYDNayMdy4=",
"clazz": "com.cobber.fta.plugins.address.USZipPlus4",
"validLocales": [
{ "localeTag": "en-US,en-CA,fr-CA", "headerRegExps": [ { "regExp": ".*(?i)(zip|postal|postcode).*", "confidence": 95 }, { "regExp": "(?i).*fips.*", "confidence": -100 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ZIP_Code" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 90,
"priority": 61
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_UK",
"description": "Postal Code (UK)",
"pluginType": "java",
"signature": "0m+ny+TVuhGGP1RGw3XKoni4Qyo=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeUK",
"validLocales": [ { "localeTag": "en-GB,en-UK" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postcodes_in_the_United_Kingdom" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"priority": 62
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_CA",
"description": "Postal Code (CA)",
"pluginType": "java",
"signature": "PJdCrn71buwdG4wyhlOpLSrc1+M=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeCA",
"validLocales": [
{
"localeTag": "en-US,en-CA,fr-CA",
"headerRegExps": [ { "regExp": ".*(?i)(post|zip).*", "confidence": 99, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Canada" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 95,
"baseType": "STRING",
"priority": 63
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_AU",
"description": "Postal Code (AU)",
"pluginType": "regex",
"signature": "GGcrawbIPrKWkNlGg2vaccl1MNY=",
"validLocales": [
{
"localeTag": "en-AU",
"headerRegExps": [ { "regExp": ".*(?i)(post).*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\d{4}"
} ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postcodes_in_Australia" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 98,
"baseType": "LONG",
"priority": 64
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_NL",
"description": "Postal Code (NL)",
"pluginType": "regex",
"signature": "zPoRG8ivy1ZRtQmx2dYu/pc6Prk=",
"validLocales": [
{
"localeTag": "en-NL,nl-NL",
"headerRegExps": [ { "regExp": ".*(?i)(post).*", "confidence": 95 }, { "regExp": ".*(?i)(code).*", "confidence": 75 } ],
"matchEntries": [
{
"regExpReturned": "\\d{4} \\p{IsAlphabetic}{2}|\\d{4}\\p{IsAlphabetic}{2}"
}
]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_the_Netherlands" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 95,
"baseType": "STRING",
"priority": 65
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_FR",
"description": "Postal Code (FR)",
"pluginType": "java",
"signature": "NBx2UhY9b1E8PKjEPXxorgBew1s=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeFR",
"validLocales": [
{
"localeTag": "fr-FR",
"headerRegExps": [ { "regExp": ".*(?i)(code.postal|cp).*", "confidence": 95 } ]
} ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_France" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"baseType": "LONG",
"threshold": 98,
"priority": 66
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_JA",
"description": "Postal Code (JA)",
"pluginType": "java",
"signature": "90grIf//XH2xAcARIKYJPzmfhJg=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeJA",
"validLocales": [ { "localeTag": "ja" } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Japan" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"priority": 67
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_PT",
"description": "Postal Code (PT)",
"pluginType": "regex",
"signature": "YOwVZiE8O4fMUH/RJ/34zgxi0yg=",
"validLocales": [
{
"localeTag": "pt-PT",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(código.postal).*", "confidence": 95, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\d{4}-\\d{3}"
} ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Portugal" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "STRING",
"priority": 68
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_DE",
"description": "Postal Code (DE)",
"pluginType": "list",
"signature": "7Q/NP19OT3uFsdQkhdDLsBJdZck=",
"validLocales": [
{ "localeTag": "de-DE", "headerRegExps": [ { "regExp": ".*(?i)(postleitzahl|zip|plz).*", "confidence": 99, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/de_postal_code.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Germany" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "LONG",
"backout": "\\d{5}",
"priority": 69
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_ES",
"description": "Postal Code (ES)",
"pluginType": "list",
"signature": "wme+qdk/tsdr4Fb4qfCyAaicpmE=",
"validLocales": [
{ "localeTag": "es-ES", "headerRegExps": [ { "regExp": ".*(?i)(postal).*", "confidence": 95, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/es_postal_code.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Spain" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "LONG",
"backout": "\\d{5}",
"priority": 70
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_SE",
"description": "Postal Code (SE)",
"pluginType": "java",
"signature": "pfVf2x3vraje4ycWyo87F5A6e38=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeSE",
"validLocales": [
{ "localeTag": "sv-SE", "headerRegExps": [ { "regExp": ".*(?i)(postnummer).*", "confidence": 99 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Sweden" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "STRING",
"priority": 71
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_UY",
"description": "Postal Code (UY)",
"pluginType": "list",
"signature": "bGHgk5RMF4mqRw5xkTxm8AdUMxg=",
"validLocales": [
{ "localeTag": "es-UY", "headerRegExps": [ { "regExp": ".*(?i)(codigo.*postal).*", "confidence": 99 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/uy_postal_code.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "LONG",
"backout": "\\d{5}",
"priority": 72
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_MX",
"description": "Postal Code (MX)",
"pluginType": "java",
"signature": "z0MBnHNCyrDo8blnBUAqjNDVwdw=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeMX",
"validLocales": [
{ "localeTag": "es-MX", "headerRegExps": [ { "regExp": ".*(?i)(c.digo.*postal).*", "confidence": 99 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Mexico" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "LONG",
"priority": 73
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_BG",
"description": "Postal Code (BG)",
"pluginType": "list",
"signature": "vf445LWLa0dN+AZtiaxv3WlOrDc=",
"validLocales": [
{ "localeTag": "bg-BG", "headerRegExps": [ { "regExp": ".*(?i)(Пощ код|Пощенски код).*", "confidence": 99 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/bg_postal_code.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Bulgaria" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"threshold": 99,
"baseType": "LONG",
"backout": "\\d{4}",
"priority": 74
},
{
"semanticType": "POSTAL_CODE.POSTAL_CODE_CO",
"description": "Postal Code (CO)",
"pluginType": "java",
"signature": "nb4TdG9sqJZTuLyvoOUywb1lA4s=",
"clazz": "com.cobber.fta.plugins.address.PostalCodeCO",
"validLocales": [
{
"localeTag": "es-CO",
"headerRegExps": [ { "regExp": ".*(?i)(codigo.postal).*", "confidence": 95 }, { "regExp": ".*(?i)(postal).*", "confidence": 85 } ]
} ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P281" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Postal_codes_in_Colombia" },
{ "source": "schema", "reference": "https://schema.org/postalCode" }
],
"baseType": "LONG",
"threshold": 98,
"priority": 75
},
{
"semanticType": "FULL_ADDRESS_EN",
"description": "Full Address (English Language)",
"pluginType": "java",
"signature": "CJFV+VSRgkE9qJFlqdfK5nVpYCM=",
"clazz": "com.cobber.fta.plugins.address.AddressFullEN",
"validLocales": [
{ "localeTag": "en-CA,en-US", "headerRegExps": [ { "regExp": ".*(?i)(address)", "confidence": 99 }, { "regExp": ".*(?i)(addr|location).*", "confidence": 95 } ] }
],
"threshold": 90,
"priority": 80
},
{
"semanticType": "STREET_ADDRESS_EN",
"description": "Street Address (English Language)",
"pluginType": "java",
"signature": "5P7tWzPdbjVvyHhLklpTf00Zxl8=",
"clazz": "com.cobber.fta.plugins.address.AddressEN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": "(?i).*(address|addr)(.*1)?", "confidence": 99 }, { "regExp": ".*(?i)(addr).*", "confidence": 95 }, { "regExp": ".*(?i)(street|location).*", "confidence": 85 } ] }
],
"threshold": 90,
"priority": 81
},
{
"semanticType": "STREET_NAME_EN",
"description": "Street Name (English Language)",
"pluginType": "java",
"signature": "3E5oqYqSkuXljmmvAl47bS8ywxM=",
"clazz": "com.cobber.fta.plugins.address.AddressStreetNameEN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": "(?i)(street|road).?name", "confidence": 99 }, { "regExp": "(?i)(street|road)", "confidence": 95 }, { "regExp": ".*(?i)(street|road).*", "confidence": 90 }, { "regExp": ".*(?i)(location).*", "confidence": 85 } ] }
],
"threshold": 90,
"priority": 82
},
{
"semanticType": "STREET_NAME_BARE_EN",
"description": "Street Name - no Marker (English Language)",
"pluginType": "java",
"signature": "f4aT7BMSi+IsDI0LannEVYe/uQI=",
"clazz": "com.cobber.fta.plugins.address.AddressStreetNameBareEN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": "(?i).*(street|road).?name", "confidence": 99, "mandatory": true }, { "regExp": "(?i).*(name|street)", "confidence": 60, "mandatory": true } ] }
],
"threshold": 90,
"priority": 83
},
{
"semanticType": "STREET_MARKER_EN",
"description": "Street Marker (English Language)",
"pluginType": "list",
"signature": "whIM9TwB3ArMA50gXTlOBjNCFJk=",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(street).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/en_street_markers.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Street_suffix" }
],
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 84
},
{
"semanticType": "STREET_ADDRESS2_EN",
"description": "Street Address - Line 2 (English Language)",
"pluginType": "java",
"signature": "8Yl3CN3MVlSIjCrXBgZCWJskI1Q=",
"clazz": "com.cobber.fta.plugins.address.Address2EN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(addr|street).*2", "confidence": 99 }, { "regExp": ".*(?i)(address|addr).+", "confidence": 90 } ] }
],
"threshold": 90,
"priority": 85
},
{
"semanticType": "STREET_ADDRESS3_EN",
"description": "Street Address - Line 3 (English Language)",
"pluginType": "java",
"signature": "swnXMC+o9QcQEBdo3yHQEeExVxo=",
"clazz": "com.cobber.fta.plugins.address.Address3EN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(addr|street).*3", "confidence": 99 }, { "regExp": ".*(?i)(address|addr).+", "confidence": 90 } ] }
],
"threshold": 90,
"priority": 86
},
{
"semanticType": "STREET_ADDRESS4_EN",
"description": "Street Address - Line 4 (English Language)",
"pluginType": "java",
"signature": "1lNQdFYXnmRkNzRqwofC40ZHx9Q=",
"clazz": "com.cobber.fta.plugins.address.Address4EN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(addr|street).*4", "confidence": 99 }, { "regExp": ".*(?i)(address|addr).+", "confidence": 90 } ] }
],
"threshold": 90,
"priority": 87
},
{
"semanticType": "STREET_NUMBER",
"description": "Street Number",
"pluginType": "java",
"signature": "JFmqXYZjmq/aTw/EALlxloQ/tgQ=",
"clazz": "com.cobber.fta.plugins.address.AddressStreetNumber",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(street|house|address).?(number|num|no)", "confidence": 99, "mandatory": true }, { "regExp": ".*(?i)(number|no|num)", "confidence": 80, "mandatory": true } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": "(?i)(huisnummer|huisnr.*)", "confidence": 99, "mandatory": true } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/House_numbering" }
],
"threshold": 95,
"priority": 88
},
{
"semanticType": "STREET_ADDRESS_",
"description": "Street Address",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.address.AddressOther",
"validLocales": [
{ "localeTag": "bg", "headerRegExps": [ { "regExp": "(?i)(?u)^адрес$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ca", "headerRegExps": [ { "regExp": "(?i)(?u)^(adreça|adresse.*1)$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "da", "headerRegExps": [ { "regExp": "(?i)^(adresse|adresse.*1)$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "de", "headerRegExps": [ { "regExp": "(?i)^(adresse|adresse.*1|anschrift)$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": "(?i)(?u)^dirección$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "fi", "headerRegExps": [ { "regExp": "(?i)^(katuosoite|osoite)$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "fr", "headerRegExps": [ { "regExp": "(?i)^(adresse|adresse.*1)$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "hr", "headerRegExps": [ { "regExp": "(?i)^adresa$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "it", "headerRegExps": [ { "regExp": "(?i)^indirizzo$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "lv", "headerRegExps": [ { "regExp": "(?i)^adrese$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": "(?i)^adres$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "pl", "headerRegExps": [ { "regExp": "(?i)^adres$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "pt", "headerRegExps": [ { "regExp": "(?i)(?u)^endereço$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ro", "headerRegExps": [ { "regExp": "(?i)^adresa$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ru", "headerRegExps": [ { "regExp": "(?i)(?u)^адрес$", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "sk", "headerRegExps": [ { "regExp": "(?i)^adresa$", "confidence": 99, "mandatory": true } ] }
],
"threshold": 90,
"priority": 89
},
{
"semanticType": "STREET_NAME_BARE_",
"description": "Street Address",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.address.AddressStreetNameBare",
"validLocales": [
{ "localeTag": "nl", "headerRegExps": [ { "regExp": "(?i)^(straat|straatnaam)$", "confidence": 99, "mandatory": true } ] }
],
"threshold": 90,
"priority": 90
},
{
"semanticType": "GENDER.TEXT_",
"description": "Gender",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.Gender",
"validLocales": [
{ "localeTag": "bg", "headerRegExps": [ { "regExp": "(?i)(?u)(Gender|пол).*", "confidence": 90 } ] },
{ "localeTag": "ca", "headerRegExps": [ { "regExp": ".*(?i)(Gender|sexe).*", "confidence": 90 } ] },
{ "localeTag": "en", "headerRegExps": [ { "regExp": "(?i)(Gender|sex)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|sex).*", "confidence": 90 } ] },
{ "localeTag": "de", "headerRegExps": [ { "regExp": ".*(?i)(Gender|sex|geschlecht).*", "confidence": 90 } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": "(?i)(Gender|genero|Sexo)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|Sexo).*", "confidence": 90 } ] },
{ "localeTag": "fi", "headerRegExps": [ { "regExp": ".*(?i)(Gender|Genre|Sukupuoli).*", "confidence": 90 } ] },
{ "localeTag": "fr", "headerRegExps": [ { "regExp": "(?i)(Gender|Genre|Sexe)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|Genre|Sexe).*", "confidence": 90 } ] },
{ "localeTag": "hr", "headerRegExps": [ { "regExp": ".*(?i)(Gender).*", "confidence": 90 } ] },
{ "localeTag": "is", "headerRegExps": [ { "regExp": "(?i)(Gender|kyn)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|kyn).*", "confidence": 90 } ] },
{ "localeTag": "it", "headerRegExps": [ { "regExp": "(?i)(Gender|genere|sesso)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|genere|sesso).*", "confidence": 90 } ] },
{ "localeTag": "ms", "headerRegExps": [ { "regExp": ".*(?i)(Gender|jantina).*", "confidence": 90 } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(Gender|sexe|Geslach|Geslacht).*", "confidence": 90 } ] },
{ "localeTag": "pl", "headerRegExps": [ { "regExp": ".*(?i)(?u)(Gender|Płeć|P³eæ).*", "confidence": 90 } ] },
{ "localeTag": "pt", "headerRegExps": [ { "regExp": "(?i)(Gender|Sexo)", "confidence": 99 }, { "regExp": ".*(?i)(Gender|Sexo).*", "confidence": 90 } ] },
{ "localeTag": "ro", "headerRegExps": [ { "regExp": ".*(?i)(Gender|sex).*", "confidence": 90 } ] },
{ "localeTag": "ru", "headerRegExps": [ { "regExp": ".*(?i)(?u)(Gender|Пол).*", "confidence": 90 } ] },
{ "localeTag": "sv", "headerRegExps": [ { "regExp": ".*(?i)(Gender|kon|kön).*", "confidence": 90 } ] },
{ "localeTag": "tr", "headerRegExps": [ { "regExp": ".*(?i)(?u)(Gender|cinsiyet).*", "confidence": 90 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P21" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Gender" },
{ "source": "schema", "reference": "https://schema.org/gender" }
],
"priority": 95
},
{
"semanticType" : "GENDER.TEXT_JA",
"description": "Gender (Japanese Language)",
"pluginType": "regex",
"signature": "Cw4ieuKHMT4qah2mJ9uWUYg+rNk=",
"validLocales": [
{
"localeTag": "ja",
"headerRegExps": [ { "regExp": "(性|性別)", "confidence": 70 } ],
"matchEntries": [ {
"regExpReturned" : "(女性|女|男性|男|その他)"
} ]
}
],
"content": {
"type": "inline",
"members": [ "女性", "女", "男性", "男", "その他" ]
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P21" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Gender" },
{ "source": "schema", "reference": "https://schema.org/gender" }
],
"backout": ".*",
"baseType" : "STRING",
"priority": 96
},
{
"semanticType" : "GENDER.TEXT_ZH",
"description": "Gender (Chinese Language)",
"pluginType": "regex",
"signature": "Cw4ieuKHMT4qah2mJ9uWUYg+rNk=",
"validLocales": [
{
"localeTag": "zh",
"headerRegExps": [ { "regExp": "(性|性別)", "confidence": 70 } ],
"matchEntries": [ {
"regExpReturned" : "(女性|女|女生|男性|男|男生)"
} ]
}
],
"content": {
"type": "inline",
"members": [ "女性" ,"女", "女生", "男性", "男", "男生" ]
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P21" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Gender" },
{ "source": "schema", "reference": "https://schema.org/gender" }
],
"backout": ".*",
"baseType" : "STRING",
"priority": 97
},
{
"semanticType" : "PERSON.AGE",
"description": "Age (person)",
"pluginType": "java",
"signature": "4IK7tmSs276PtQDC39Ggz27RB1g=",
"clazz": "com.cobber.fta.plugins.person.Age",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": "(?i)(age|age[_ ].*|.*[_ ]age)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": "(?i)(edad)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "fr",
"headerRegExps": [ { "regExp": "(?i)(?u)([aâ]ge|[aâ]ge[_ ].*|.*[_ '][aâ]ge)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "it",
"headerRegExps": [ { "regExp": "(?i)(?u)(età)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": "(?i)(leeftijd)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "pt",
"headerRegExps": [ { "regExp": "(?i)(idade)", "confidence": 90, "mandatory": true } ]
}
],
"baseType" : "LONG",
"priority": 98
},
{
"semanticType" : "PERSON.AGE_RANGE",
"description": "Age range (person)",
"pluginType": "java",
"signature": "GrV4FjafBbHWYAXm6qKNFdpmfi8=",
"clazz": "com.cobber.fta.plugins.person.AgeRange",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [
{ "regExp": "(?i)(age|ages|age[_ ].*|.*[_ ]age)", "confidence": 90, "mandatory": true },
{ "regExp": "(?i)age.*", "confidence": 60, "mandatory": true }
]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": "(?i).*edad.*", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "fr",
"headerRegExps": [
{ "regExp": "(?i)(?u)([aâ]ge|[aâ]ge[_ ].*|.*[_ '][aâ]ge)", "confidence": 90, "mandatory": true },
{ "regExp": "(?i)(?u)âge.*", "confidence": 60, "mandatory": true }
]
},
{
"localeTag": "it",
"headerRegExps": [ { "regExp": "(?i)(?u)(età)", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": "(?i)leeftijd.*", "confidence": 90, "mandatory": true } ]
},
{
"localeTag": "pt",
"headerRegExps": [ { "regExp": "(?i)idade.*", "confidence": 90, "mandatory": true } ]
}
],
"priority": 99
},
{
"semanticType" : "PERSON.RACE_EN",
"description": "Race/Ethnicity (person)",
"pluginType": "java",
"signature": "20Jx6q02Vkew5xiX87Cnvi2EVf4=",
"clazz": "com.cobber.fta.plugins.person.Race",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(race|ethnic).*", "confidence": 95, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Race_(human_categorization)" }
],
"priority": 100
},
{
"semanticType" : "PERSON.RACE_ABBR_EN",
"description": "Race/Ethnicity (person)",
"pluginType": "java",
"signature": "exN+QvGFqAfnTL793VLPx85wmQ0=",
"clazz": "com.cobber.fta.plugins.person.RaceAbbr",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": "(?i)(race|ethnic).*|.*(?i)(race|ethnicity)", "confidence": 95, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Race_(human_categorization)" }
],
"priority": 101
},
{
"semanticType" : "PERSON.MARITAL_STATUS_EN",
"description": "Marital Status (person)",
"pluginType": "java",
"signature": "BHhRzS4WZnSye7mgRa+J3L1fEWQ=",
"clazz": "com.cobber.fta.plugins.person.MaritalStatus",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(marital.?status).*", "confidence": 95, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Marital_status" }
],
"priority": 102
},
{
"semanticType": "NATIONALITY_EN",
"description": "Nationality (English Language)",
"pluginType": "list",
"signature": "FO3IMfeesbLJh6WwceQWPVORcnE=",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(nationality).*", "confidence": 90 } ] }
],
"ignoreList": [ "N/A", "OTHER" ],
"content": {
"type": "resource",
"reference": "/reference/en_nationality.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Nationality" },
{ "source": "schema", "reference": "https://schema.org/nationality" }
],
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 103
},
{
"semanticType": "NATIONALITY_NL",
"description": "Nationality (Dutch Language)",
"pluginType": "list",
"signature": "1oOVHBz4YE+HmzPDQSy/OjpSBiA=",
"validLocales": [
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(nationaliteit).*", "confidence": 90 } ] }
],
"ignoreList": [ "N/A", "OTHER" ],
"content": {
"type": "resource",
"reference": "/reference/nl_nationality.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Nationality" },
{ "source": "schema", "reference": "https://schema.org/nationality" }
],
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 104
},
{
"semanticType": "HONORIFIC_EN",
"description": "Honorific (English Language)",
"pluginType": "list",
"signature": "/Di73LZHHGjcJYhigTqSTQrtTvA=",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(honorific|title).*", "confidence": 90 } ] }
],
"ignoreList": [ "N/A", "OTHER" ],
"content": {
"type": "resource",
"reference": "/reference/en_honorific.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P511" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/English_honorifics" },
{ "source": "schema", "reference": "https://schema.org/honorificPrefix" }
],
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 105
},
{
"semanticType": "COUNTRY.TEXT_DE",
"description": "Country as a string (German)",
"pluginType": "list",
"signature": "Rs6U63buoAAlnITZdPtJuxUrgNg=",
"validLocales": [
{ "localeTag": "de", "headerRegExps": [ { "regExp": ".*(?i)(land).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/de_countries.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Choronym" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_country_names_in_various_languages" },
{ "source": "schema", "reference": "https://schema.org/Country" }
],
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 106
},
{
"semanticType": "COUNTRY.TEXT_ES",
"description": "Country as a string (Spanish)",
"pluginType": "list",
"signature": "fot3XHPIh18wTcBDyeN3DlY7LYY=",
"validLocales": [
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(pais).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/es_countries.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Choronym" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_country_names_in_various_languages" },
{ "source": "schema", "reference": "https://schema.org/Country" }
],
"threshold": 90,
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 107
},
{
"semanticType": "COUNTRY.TEXT_NL",
"description": "Country as a string (Dutch)",
"pluginType": "list",
"signature": "SVnejJJWKhuw1LMRsCaHojewEOk=",
"validLocales": [
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(land).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/nl_countries.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Choronym" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_country_names_in_various_languages" },
{ "source": "schema", "reference": "https://schema.org/Country" }
],
"threshold": 90,
"backout": "[\\p{IsAlphabetic}\\.]+",
"priority": 108
},
{
"semanticType": "COUNTRY.TEXT_EN",
"description": "Country as a string (English language)",
"pluginType": "java",
"signature": "T4UZNFT895GsC99J7dOz/ENNYvM=",
"clazz": "com.cobber.fta.plugins.CountryEN",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(country).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[\\p{IsAlphabetic}][-\\p{IsAlphabetic} '\\.(),]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_countries.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Choronym" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_country_names_in_various_languages" },
{ "source": "schema", "reference": "https://schema.org/Country" }
],
"threshold": 85,
"backout": ".+",
"priority": 109
},
{
"semanticType": "MONTH.ABBR_",
"description": "Month Abbreviation = Locale, e.g. en-US for English language in US)",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.MonthAbbr",
"validLocales": [ { "localeTag": "*" } ],
"priority": 110
},
{
"semanticType": "MONTH.FULL_",
"description": "Full Month name = Locale, e.g. en-US for English language in US)",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.MonthFull",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Month" }
],
"priority": 111
},
{
"semanticType": "DAY.ABBR_",
"description": "Day of Week Abbreviation = Locale, e.g. en-US for English language in US)",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.DOWAbbr",
"validLocales": [ { "localeTag": "*" } ],
"priority": 112
},
{
"semanticType": "DAY.FULL_",
"description": "Full Day of Week name = Locale, e.g. en-US for English language in US)",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.DOWFull",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Names_of_the_days_of_the_week" }
],
"priority": 113
},
{
"semanticType": "PERIOD.QUARTER",
"description": "Quarter (Year)",
"pluginType": "java",
"signature": "H0LOGKpMF3InUXIIU5pCKHEReTo=",
"clazz": "com.cobber.fta.plugins.PeriodQuarter",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(quarter|qtr).*", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": ".*(?i)(periode).*", "confidence": 99, "mandatory": true } ]
} ],
"priority": 114
},
{
"semanticType": "PERIOD.HALF",
"description": "Half (Year)",
"pluginType": "regex",
"signature": "lc0Ep9P3R6hDY6EIlSvRtjjvfbc=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(half).*", "confidence": 99 } ],
"matchEntries": [ {
"regExpReturned": "(?i)(H1|H2)",
"isRegExpComplete": true
} ]
}
],
"priority": 115
},
{
"semanticType": "PERIOD.YEAR_RANGE",
"description": "Year Range",
"pluginType": "java",
"signature": "nA7JzkjHCLvvRAfhvJv12v4FNgU=",
"clazz": "com.cobber.fta.plugins.PeriodYearRange",
"validLocales": [ { "localeTag": "*" } ],
"priority": 116
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_CA",
"description": "Canadian Province Code",
"pluginType": "list",
"signature": "jwzKHMfuq3AO4lEKEm0e/ZmOIRA=",
"validLocales": [
{ "localeTag": "en-US,en-CA,fr-CA,en-MX", "headerRegExps": [ { "regExp": ".*(?i)(province).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ca_provinces.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_and_territories_of_Canada" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 120
},
{
"semanticType": "STATE_PROVINCE.STATE_MX",
"description": "Mexican State Code",
"pluginType": "list",
"signature": "h565UW3Wl3GYzYAriMJM6T1LsmY=",
"validLocales": [
{ "localeTag": "en-US,en-CA,fr-CA,en-MX,es-MX", "headerRegExps": [ { "regExp": ".*(?i)(estado).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/mx_states.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_states_of_Mexico" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{3}",
"priority": 121
},
{
"semanticType": "STATE_PROVINCE.STATE_US",
"description": "US State Code",
"pluginType": "list",
"signature": "JD5jeXHLzGctpqicY44B9iJzyXU=",
"validLocales": [
{ "localeTag": "en-US,en-Latn-US,en-CA,fr-CA,en-MX", "headerRegExps": [ { "regExp": ".*(?i)(state).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/us_states.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_states_and_territories_of_the_United_States" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 122
},
{
"semanticType": "STATE_PROVINCE.STATE_PROVINCE_NA",
"description": "US State Code/Canadian Province Code/Mexican State Code",
"pluginType": "list",
"signature": "Q00LXfhmPibwrK8HTkzNsRosvzw=",
"validLocales": [
{
"localeTag": "en-US,en-CA,fr-CA,en-MX",
"headerRegExps": [ { "regExp": ".*(?i)(state|province|estado).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "\\p{Alpha}{2}"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/na_states_provinces.csv"
},
"documentation": [
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 123
},
{
"semanticType": "STATE_PROVINCE.STATE_AU",
"description": "Australian State Code",
"pluginType": "list",
"signature": "khHytrFa0Oj4KP/37i2mRhJmliU=",
"validLocales": [
{
"localeTag": "en-AU",
"headerRegExps": [ { "regExp": ".*(?i)(state).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "(?i)(ACT|NSW|NT|QLD|SA|TAS|VIC|WA)"
} ]
}
],
"content": {
"type": "inline",
"members": [ "ACT", "NSW", "NT", "QLD", "SA", "TAS", "VIC", "WA" ]
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/States_and_territories_of_Australia" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2,3}",
"priority": 124
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_IT",
"description": "Italian Province Code",
"pluginType": "list",
"signature": "0vMZaBH760lIeD7hdvi7RVIDoVc=",
"validLocales": [
{ "localeTag": "it-IT", "headerRegExps": [ { "regExp": ".*(?i)(province|provincia).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/it_provinces.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Italy" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 125
},
{
"semanticType": "STATE_PROVINCE.CANTON_CH",
"description": "Swiss CANTON Code",
"pluginType": "list",
"signature": "YNu63sC5qbl7DWY0aV4khfLKrXs=",
"validLocales": [
{ "localeTag": "de-CH,fr-CH,it-CH", "headerRegExps": [ { "regExp": ".*(?i)(canton|kanton|cantone).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ch_cantons.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Cantons_of_Switzerland" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 126
},
{
"semanticType": "STATE_PROVINCE.STATE_BR",
"description": "Brazilian State Code",
"pluginType": "list",
"signature": "5B0N5wsZpS+g/ck2cXCQjtqYwXA=",
"validLocales": [
{ "localeTag": "pt-BR", "headerRegExps": [ { "regExp": "(?i)uf", "confidence": 99 }, { "regExp": ".*(?i)(estado|state).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/br_states.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Federative_units_of_Brazil" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 127
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_ZA",
"description": "South African Province Code",
"pluginType": "list",
"signature": "nXFbO6uiHPMEct83mAPMsziYPtI=",
"validLocales": [
{ "localeTag": "en-ZA", "headerRegExps": [ { "regExp": ".*(?i)(province).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/za_provinces.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_South_Africa" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 128
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_CA",
"description": "Canadian Province Name",
"pluginType": "list",
"signature": "hiCNMWvc1MO99KTP8IaH1Fp3s3Y=",
"validLocales": [
{
"localeTag": "en-US,en-CA,fr-CA,en-MX",
"headerRegExps": [ { "regExp": ".*(?i)(province).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[- \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/ca_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_and_territories_of_Canada" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[- \\p{IsAlphabetic}]+",
"priority": 130
},
{
"semanticType": "STATE_PROVINCE.STATE_NAME_MX",
"description": "Mexican State Name",
"pluginType": "list",
"signature": "f5Bx+omlv1xMG6Oq8XQo5RkrtmU=",
"validLocales": [
{
"localeTag": "en-US,es-US,en-CA,fr-CA,en-MX,es-MX",
"headerRegExps": [ { "regExp": ".*(?i)(estado).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/mx_states_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_states_of_Mexico" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 131
},
{
"semanticType": "STATE_PROVINCE.STATE_NAME_US",
"description": "US State Name",
"pluginType": "list",
"signature": "y0oxFvZb1RpG1UVwi/hSCEymwzc=",
"validLocales": [
{
"localeTag": "en-US,es-US,en-CA,fr-CA,en-MX",
"headerRegExps": [ { "regExp": ".*(?i)(state).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/us_states_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_states_and_territories_of_the_United_States" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 132
},
{
"semanticType": "STATE_PROVINCE.STATE_PROVINCE_NAME_NA",
"description": "US State Name/Canadian Province Name/Mexican State Name",
"pluginType": "list",
"signature": "KfDjCnkj/KmZglkvM32W3OBEwxU=",
"validLocales": [
{
"localeTag": "en-US,es-US,en-CA,fr-CA,en-MX",
"headerRegExps": [ { "regExp": ".*(?i)(state|province|estado).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[\\p{IsAlphabetic} ]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/na_states_provinces_full.csv"
},
"documentation": [
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 133
},
{
"semanticType": "STATE_PROVINCE.STATE_NAME_AU",
"description": "Australian State Name",
"pluginType": "list",
"signature": "iNmmCNk8cEQ6mQuhOTxSlO+nvUk=",
"validLocales": [
{
"localeTag": "en-AU",
"headerRegExps": [ { "regExp": ".*(?i)(state).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[\\p{IsAlphabetic} ]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/au_states_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/States_and_territories_of_Australia" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 134
},
{
"semanticType": "STATE_PROVINCE.STATE_NAME_DE",
"description": "German State Name",
"pluginType": "list",
"signature": "bEx7JkLIUY8fjFyEhsjeJfx2k6o=",
"validLocales": [
{
"localeTag": "de-DE",
"headerRegExps": [ { "regExp": ".*(?i)(state|staat).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[- \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/de_states_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/States_of_Germany" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 135
},
{
"semanticType": "STATE_PROVINCE.REGION_NAME_FR",
"description": "French Region",
"pluginType": "list",
"signature": "hiZwJanMwVKNX7yumKr1rNKQNN8=",
"validLocales": [
{
"localeTag": "fr-FR",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(region|région).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-' \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/fr_regions.csv"
},
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 136
},
{
"semanticType": "STATE_PROVINCE.DEPARTMENT_NAME_FR",
"description": "French Department",
"pluginType": "list",
"signature": "oOZtEv/rhMuaXVd2SLFBvR1VShI=",
"validLocales": [
{
"localeTag": "fr-FR",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(department|département).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-' \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/fr_department.csv"
},
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 137
},
{
"semanticType": "STATE_PROVINCE.INSEE_CODE_FR",
"description": "French Insee Code (5 digit)",
"pluginType": "java",
"signature": "2dBxTIccKcNhE+xvma/5fTAfhiw=",
"clazz": "com.cobber.fta.plugins.InseeCodeFR",
"validLocales": [
{ "localeTag": "fr-FR", "headerRegExps": [ { "regExp": ".*(?i)(insee).*", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/INSEE_code" }
],
"baseType": "LONG",
"backout": "\\d{5}",
"priority": 138
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_IT",
"description": "Italian Province Name",
"pluginType": "list",
"signature": "veLvb2gbLjr395Sbu+jeP0R9ciQ=",
"validLocales": [
{
"localeTag": "it-IT",
"headerRegExps": [ { "regExp": ".*(?i)(province|provincia).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-' \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/it_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Italy" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 139
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_ES",
"description": "Spanish Province Name",
"pluginType": "list",
"signature": "w5axJ/mMkNw2fiYY3xw7ZDvRurM=",
"validLocales": [
{
"localeTag": "es-ES",
"headerRegExps": [ { "regExp": ".*(?i)(province|provincias|provincia).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/es_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Spain" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 140
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_NL",
"description": "Netherlands Province Name",
"pluginType": "list",
"signature": "LfF0rgcJobv3P/9fW8+SAzpl//c=",
"validLocales": [
{
"localeTag": "en-NL,nl-NL",
"headerRegExps": [ { "regExp": ".*(?i)(province|provincie).*", "confidence": 99 } ],
"matchEntries": [ {
"regExpReturned": "[- \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/nl_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_the_Netherlands" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[- \\p{IsAlphabetic}]+",
"priority": 141
},
{
"semanticType": "STATE_PROVINCE.COUNTY_US",
"description": "US County Name",
"pluginType": "list",
"signature": "NkMoovh9DwxDIeJXza8dsJ4wRzY=",
"validLocales": [
{
"localeTag": "en-US",
"headerRegExps": [ { "regExp": ".*(?i)(county).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-\\.,' \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/us_counties_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/County_(United_States)" }
],
"backout": "[-,\\.,' \\p{IsAlphabetic}]+",
"priority": 142
},
{
"semanticType": "STATE_PROVINCE.COUNTY_UK",
"description": "United Kingdom County Name",
"pluginType": "list",
"signature": "ppbqIL83hfnExGV8bdzIoA3hLN8=",
"validLocales": [
{
"localeTag": "en-GB,en-UK",
"headerRegExps": [ { "regExp": ".*(?i)(county).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-,& \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/gb_counties_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Counties_of_the_United_Kingdom" }
],
"backout": "[-,& \\p{IsAlphabetic}]+",
"priority": 143
},
{
"semanticType": "STATE_PROVINCE.CANTON_NAME_CH",
"description": "Swiss CANTON Name",
"pluginType": "list",
"signature": "s2RWNkJraOojAx4YB3NlVxPjqOY=",
"validLocales": [
{
"localeTag": "de-CH,fr-CH,it-CH",
"headerRegExps": [ { "regExp": ".*(?i)(canton|kanton|cantone).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-\\. \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/ch_cantons_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Cantons_of_Switzerland" }
],
"backout": "[-\\. \\p{IsAlphabetic}]+",
"priority": 144
},
{
"semanticType": "STATE_PROVINCE.STATE_NAME_BR",
"description": "Brazilian State Name",
"pluginType": "list",
"signature": "Av9xqFJX7iwzve2N0bwz5yImxnM=",
"validLocales": [
{
"localeTag": "pt-BR",
"headerRegExps": [ { "regExp": ".*(?i)(estado|state).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-\\. \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/br_states_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Federative_units_of_Brazil" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[-\\. \\p{IsAlphabetic}]+",
"priority": 145
},
{
"semanticType": "STATE_PROVINCE.PREFECTURE_NAME_JA",
"description": "Japanese Prefecture Name",
"pluginType": "list",
"signature": "qUPFgdl8kNvmZ8M55kR4qaFp184=",
"validLocales": [
{
"localeTag": "ja",
"headerRegExps": [ { "regExp": ".*(?i)(都道府県|todōfuken).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-\\. \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/ja_prefectures_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Prefectures_of_Japan" }
],
"backout": "[-\\. \\p{IsAlphabetic}]+",
"priority": 146
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_ZA",
"description": "South African Province Name",
"pluginType": "list",
"signature": "79CAHTLod2FXV8V4iLZvXQ5r61M=",
"validLocales": [
{
"localeTag": "en-ZA",
"headerRegExps": [ { "regExp": ".*(?i)(province).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/za_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_South_Africa" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 147
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_EC",
"description": "Ecuadorian Province Name",
"pluginType": "list",
"signature": "rre1QxKeEKPUbmo5hHdo62LHQKg=",
"validLocales": [
{
"localeTag": "es-EC",
"headerRegExps": [ { "regExp": ".*(?i)(provincia).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/ec_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Ecuador" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 148
},
{
"semanticType": "STATE_PROVINCE.DISTRICT_NAME_PT",
"description": "Portuguese District Name",
"pluginType": "list",
"signature": "zx5UQndn84s9pYXMKYEV/HEuu9U=",
"validLocales": [
{
"localeTag": "pt-PT",
"headerRegExps": [ { "regExp": ".*(?i)(Distritos|District).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[ \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/pt_districts_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_municipalities_of_Portugal" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 149
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_BR",
"description": "Brazilian Municipality",
"pluginType": "list",
"signature": "+FROCExRov0I3emW4ucxNDfQvr0=",
"validLocales": [
{ "localeTag": "pt-BR", "headerRegExps": [ { "regExp": ".*(?i)(Município).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/br_municipalities.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Municipalities_of_Brazil" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 150
},
{
"semanticType": "STATE_PROVINCE.REGION_NAME_IT",
"description": "Italian Region",
"pluginType": "list",
"signature": "B4v2+3XVmicFB1PR2TVBV6ikoig=",
"validLocales": [
{ "localeTag": "it-IT", "headerRegExps": [ { "regExp": ".*(?i)(regione).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/it_regions.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Regions_of_Italy" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 151
},
{
"semanticType": "STATE_PROVINCE.COMMUNE_IT",
"description": "Italian Commune",
"pluginType": "list",
"signature": "3QajzO92Nvv5D9haTofNgKJ6HNo=",
"validLocales": [
{ "localeTag": "it-IT", "headerRegExps": [ { "regExp": ".*(?i)(comune|comuni).*", "confidence": 95 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/it_comuni.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Comune" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"threshold": 85,
"priority": 152
},
{
"semanticType": "STATE_PROVINCE.COUNTY_HU",
"description": "Hungarian County",
"pluginType": "list",
"signature": "Cif4jZjegKgHwceZACrW5E0Vsdg=",
"validLocales": [
{ "localeTag": "hu-HU", "headerRegExps": [ { "regExp": ".*(?i)(?u)(megye).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/hu_counties.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Counties_of_Hungary" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 153
},
{
"semanticType": "STATE_PROVINCE.COUNTY_IE",
"description": "Irish County",
"pluginType": "list",
"signature": "umrsnOd/JEy0ddIXpTD9iNBe7w8=",
"validLocales": [
{ "localeTag": "en-IE,ga-IE", "headerRegExps": [ { "regExp": ".*(?i)(county|contae).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ie_counties.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Counties_of_Ireland" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 154
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_IE",
"description": "Irish Province",
"pluginType": "list",
"signature": "x5yTiBlrSflCR2o91jz1tILKp9c=",
"validLocales": [
{ "localeTag": "en-IE", "headerRegExps": [ { "regExp": ".*(?i)(province).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ie_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Ireland" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 155
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_MX",
"description": "Mexican Municipality",
"pluginType": "list",
"signature": "kepJbVnP+P/TSoxgry2mxiQFOg4=",
"validLocales": [
{ "localeTag": "es-MX", "headerRegExps": [ { "regExp": ".*(?i)(município).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/mx_municipalities.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Municipalities_of_Mexico" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 156
},
{
"semanticType": "STATE_PROVINCE.SUBURB_AU",
"description": "Australian Suburb",
"pluginType": "java",
"signature": "VR2/cf7EOxcm7ed9eGp8A2j1fn4=",
"clazz": "com.cobber.fta.plugins.address.SuburbAU",
"validLocales": [
{ "localeTag": "en-AU", "headerRegExps": [ { "regExp": ".*(?i)(suburb).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/au_suburbs"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Suburbs_and_localities_(Australia)" }
],
"backout": "[' \\p{IsAlphabetic}]+",
"priority": 157
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_CO",
"description": "Colombian Municipality",
"pluginType": "list",
"signature": "w7YfMi7yPXuoePHgfnM7RDyb6UE=",
"validLocales": [
{ "localeTag": "es-CO", "headerRegExps": [ { "regExp": ".*(?i)(municipio).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/co_municipalities.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Municipalities_of_Colombia" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 158
},
{
"semanticType": "STATE_PROVINCE.DEPARTMENT_CO",
"description": "Colombian Department",
"pluginType": "list",
"signature": "V3LTco+XmMy0HMMj8+HljXecDyU=",
"validLocales": [
{ "localeTag": "es-CO", "headerRegExps": [ { "regExp": ".*(?i)(departamento).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/co_departments.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Departments_of_Colombia" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 159
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_NL",
"description": "Dutch Municipality",
"pluginType": "list",
"signature": "eHt5Aj3a8lO9nvH9CeV/O3NgZZs=",
"validLocales": [
{ "localeTag": "en-NL,nl-NL", "headerRegExps": [ { "regExp": ".*(?i)(gemeente).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/nl_municipalities.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Municipalities_of_the_Netherlands" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 160
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_CODE_NL",
"description": "Dutch Municipality Code",
"pluginType": "java",
"signature": "6jAs4X5jVlK2N0D0PxVkpA7+/oM=",
"clazz": "com.cobber.fta.plugins.MunicipalityCodeNL",
"validLocales": [
{ "localeTag": "en-NL,nl-NL", "headerRegExps": [ { "regExp": ".*(?i)gemeente.?(code|nummer|nr).*", "confidence": 95, "mandatory": true } ] }
],
"threshold": 95,
"priority": 161
},
{
"semanticType": "STATE_PROVINCE.REGION_NAME_PE",
"description": "Peruvian Region/Department",
"pluginType": "list",
"signature": "io6yqW4LXX2PIsoCvmxZnnPT1z8=",
"validLocales": [
{ "localeTag": "es-PE", "headerRegExps": [ { "regExp": ".*(?i)(DEPARTAMENTO).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/pe_regions_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Regions_of_Peru" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 162
},
{
"semanticType": "STATE_PROVINCE.PROVINCE_NAME_PE",
"description": "Peruvian Province",
"pluginType": "list",
"signature": "Vd/g5Nd1nVYMHINBmfqo2NKh8rs=",
"validLocales": [
{ "localeTag": "es-PE", "headerRegExps": [ { "regExp": ".*(?i)(provincia).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/pe_provinces_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Provinces_of_Peru" },
{ "source": "schema", "reference": "https://schema.org/State" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 163
},
{
"semanticType": "STATE_PROVINCE.REGION_NAME_TZ",
"description": "Tanzanian Region",
"pluginType": "list",
"signature": "bZbn9evDcCJHly+8OSWNQKMgy9I=",
"validLocales": [
{ "localeTag": "en-TZ,sw-TZ", "headerRegExps": [ { "regExp": ".*(?i)(region|mkoa).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/tz_regions.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Regions_of_Tanzania" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 164
},
{
"semanticType": "STATE_PROVINCE.STATE_FIPS_US",
"description": "US State FIPS code",
"pluginType": "list",
"signature": "O8b5Lowq3YNUDncXgb6o3mbAK24=",
"validLocales": [
{ "localeTag": "en-US", "headerRegExps": [ { "regExp": ".*(?i)(fips).*", "confidence": 99, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/us_states_fips.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_United_States_FIPS_codes_by_county" }
],
"baseType": "LONG",
"backout": "\\d{2}",
"priority": 165
},
{
"semanticType": "STATE_PROVINCE.COUNTY_FIPS_US",
"description": "US County FIPS code",
"pluginType": "list",
"signature": "NajwouqG0A46TSthygu44kw8ZiY=",
"validLocales": [
{ "localeTag": "en-US", "headerRegExps": [ { "regExp": ".*(?i)(fips).*", "confidence": 99, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/us_counties_fips.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Federal_Information_Processing_Standard_state_code" }
],
"baseType": "LONG",
"backout": "\\d{5}",
"priority": 166
},
{
"semanticType": "STATE_PROVINCE.MUNICIPALITY_CODE_BR",
"description": "Brazilian Municipality code",
"pluginType": "list",
"signature": "iLd8/9w+oQ6rSIDO2yP6kx/uJIg=",
"validLocales": [
{ "localeTag": "pt-BR", "headerRegExps": [ { "regExp": ".*(?i)(ibge).*", "confidence": 99 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/br_municipalities_code.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Municipalities_of_Brazil" }
],
"baseType": "LONG",
"backout": "\\d{7}",
"priority": 167
},
{
"semanticType": "CURRENCY_CODE.ISO-4217",
"description": "Currency as defined by ISO 4217",
"pluginType": "list",
"signature": "HElKonWFB+FY+MspBKm3eCwwrVo=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*4217.*", "confidence": 90 }, { "regExp": ".*(?i)(currency).*", "confidence": 70 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ISO-4217.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P498" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISO_4217" },
{ "source": "schema", "reference": "https://schema.org/priceCurrency" }
],
"backout": "\\p{IsAlphabetic}{3}",
"priority": 170
},
{
"semanticType": "CURRENCY.TEXT_EN",
"description": "Currency Name",
"pluginType": "list",
"signature": "hp7SSeC1M4SD1q40lH1wjYzrgV8=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(currency).*", "confidence": 90 } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_currency_full.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Currency" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 171
},
{
"semanticType": "COUNTRY.ISO-3166-3",
"description": "Country as defined by ISO 3166 - Alpha 3",
"pluginType": "list",
"signature": "WyaPkc1jgevOXlDl5bt1Za4j8ko=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(iso|3166).*", "confidence": 90 }, { "regExp": ".*(?i)(country|pais|land.?code).*", "confidence": 80 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ISO-3166-3.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P298" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISO_3166-1_alpha-3" }
],
"backout": "\\p{IsAlphabetic}{3}",
"priority": 172
},
{
"semanticType": "COUNTRY.ISO-3166-2",
"description": "Country as defined by ISO 3166 - Alpha 2",
"pluginType": "list",
"signature": "2ySMIn/48aoAVrw/OwOCKdYI4OE=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(iso|3166).*", "confidence": 90, "mandatory": true }, { "regExp": ".*(?i)(country|pais|land.?code).*", "confidence": 80, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ISO-3166-2.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P297" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISO_3166-1_alpha-2" },
{ "source": "schema", "reference": "https://schema.org/eligibleRegion" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 173
},
{
"semanticType": "TIMEZONE.IANA",
"description": "IANA Time Zone (Olson)",
"pluginType": "list",
"signature": "AYkvNH/jCNxWHK4uLso7vEbNh5U=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(timezone|olson).*", "confidence": 99 }, { "regExp": ".*(?i)(zone).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/timezones.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P6687" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/List_of_tz_database_time_zones" }
],
"backout": "[-_/A-Za-z]+",
"priority": 174
},
{
"semanticType": "CONTINENT.TEXT_EN",
"description": "Continent",
"pluginType": "list",
"signature": "LpGvbcbbeanXoAkIVobKRfMuzcg=",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(continent|region).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/en_continent.csv"
},
"backout": "[ \\p{IsAlphabetic}]+",
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P30" }
],
"priority": 175
},
{
"semanticType": "CONTINENT.CODE_EN",
"description": "Continent Code",
"pluginType": "list",
"signature": "7VSVzDUptpe+9R5UafDWEwLqKs4=",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(continent|region).*", "confidence": 90 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/en_continent_code.csv"
},
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 176
},
{
"semanticType": "AIRPORT_CODE.IATA",
"description": "IATA Airport Code",
"pluginType": "list",
"signature": "yRx9nzsOl22lQTstXrT43OVBZoU=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(iata|air).*", "confidence": 99, "mandatory": true } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/IATA.txt"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/IATA_airport_code" },
{ "source": "schema", "reference": "https://schema.org/iataCode" }
],
"backout": "\\p{IsAlphabetic}{3}",
"threshold": 97,
"priority": 177
},
{
"semanticType": "AIRLINE.IATA_CODE",
"description": "IATA Airline Code",
"pluginType": "list",
"signature": "DFUIUVTe2c6xa7beZSL16iYFj2Q=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(iata|air).*", "confidence": 99, "mandatory": true } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/IATA_airline.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Airline_codes#IATA_airline_designator" },
{ "source": "schema", "reference": "https://schema.org/iataCode" }
],
"backout": "\\p{Alnum}{2}",
"threshold": 97,
"priority": 178
},
{
"semanticType": "AIRLINE.TEXT_EN",
"description": "Airline Name",
"pluginType": "list",
"signature": "pE1aMtjAkbETBURTHyhqlYPTuPQ=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(airline).*", "confidence": 99 } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_airlines.csv"
},
"backout": "[ \\p{IsAlphabetic}]+",
"threshold": 85,
"priority": 179
},
{
"semanticType": "FILENAME",
"description": "Name of file",
"pluginType": "java",
"signature": "UkQ1ljXZ3ZmHjjp2cXuVE2gFLPw=",
"clazz": "com.cobber.fta.plugins.FileName",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(file.?name).*", "confidence": 99 } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Filename" }
],
"priority": 180
},
{
"semanticType": "PERSON.YEAR_OF_BIRTH",
"description": "Person - Year of Birth",
"pluginType": "java",
"signature": "MwDOGFRD1CFBe0yMNQwdyIN+QQg=",
"clazz": "com.cobber.fta.plugins.person.BirthYear",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(year.*birth|birth.*year).*", "confidence": 99, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P569" },
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Q2389905" }
],
"baseType": "LOCALDATE",
"priority": 181
},
{
"semanticType": "PERSON.DATE_OF_BIRTH",
"description": "Person - Date of Birth",
"pluginType": "java",
"signature": "Z7j4EoOy8qSVaYqEGBrpSkqpwRo=",
"clazz": "com.cobber.fta.plugins.person.DOB",
"validLocales": [
{
"localeTag": "es",
"headerRegExps": [ { "regExp": ".*(?i)(fecha.*nacimiento|date.*birth|birth.*date|birthday).*", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": ".*(?i)(geboortedatum|date.*birth|birth.*date|birthday).*", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(date.*birth|birth.*date|birthday).*|DOB", "confidence": 99, "mandatory": true } ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P569" },
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Q2389905" },
{ "source": "schema", "reference": "https://schema.org/birthDate" }
],
"priority": 182
},
{
"semanticType": "COORDINATE.LATITUDE_DECIMAL",
"description": "Latitude (Decimal degrees)",
"pluginType": "regex",
"signature": "5+1TLjdhcG8m3gVn0m/r6uLmh/Q=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(latitude|lattitude|[^\\p{IsAlphabetic}]lat[^\\p{IsAlphabetic}]).*|.*[^\\p{IsAlphabetic}]lat|^(lat)$|^lat[^\\p{IsAlphabetic}].*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpsToMatch": [ "\\d*\\.?\\d+", "[+-]?\\d*\\.?\\d+" ],
"regExpReturned": "([+-]?([0-9]|[0-8][0-9])\\.\\d+)|[+-]?90\\.0+|0",
"isRegExpComplete": true
} ]
},
{
"localeTag": "ca,da,de,es,fi,fr,it,ja,nl,ro,ru,zh",
"headerRegExps": [ { "regExp": ".*(?i)(latitude|lattitude|leveysaste|breddegrad|breedtegraad|breitengrad|latitudine|latitud|Широта|緯度|[^\\p{IsAlphabetic}]lat[^\\p{IsAlphabetic}]).*|.*[^\\p{IsAlphabetic}]lat|^(lat)$|^lat[^\\p{IsAlphabetic}].*", "confidence": 99, "mandatory": true } ],
"matchEntries": [
{
"regExpsToMatch": [ "\\d*\\.?\\d+", "[+-]?\\d*\\.?\\d+" ],
"regExpReturned": "(-?([0-9]|[0-8][0-9])\\.\\d+)|-?90\\.0+",
"isRegExpComplete": true
},
{
"regExpsToMatch": [ "\\d*,?\\d+", "[+-]?\\d*,?\\d+" ],
"regExpReturned": "(-?([0-9]|[0-8][0-9]),\\d+)|-?90,0+",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Latitude" },
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Q34027" },
{ "source": "schema", "reference": "https://schema.org/latitude" }
],
"threshold": 98,
"baseType": "DOUBLE",
"minimum": "-90.0",
"maximum": "90.0",
"priority": 190
},
{
"semanticType": "COORDINATE.LONGITUDE_DECIMAL",
"description": "Longitude (Decimal degrees)",
"pluginType": "regex",
"signature": "nDTXmMjlW1pm2Rav/0mJVPeRvKc=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(longitude|longtitude|[^\\p{IsAlphabetic}]long[^\\p{IsAlphabetic} ]).*|.*[^\\p{IsAlphabetic}](lon|long)$|^(lon|lng|long)$|^(lon|long)[^\\p{IsAlphabetic} ].*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpsToMatch": [ "\\d*\\.?\\d+", "[+-]?\\d*\\.?\\d+", "[+-]?\\d*\\.?\\d+(?:[eE]([+-]?\\d+))?" ],
"regExpReturned": "([+-]?([0-9]|[0-9][0-9]|1[0-7][0-9])\\.\\d+)|[+-]?180\\.0+|[+-]?\\d*\\.?\\d+([eE]([+-]?\\d{1,3}))?",
"isRegExpComplete": false
} ]
},
{
"localeTag": "ca,da,de,es,fi,fr,it,ja,nl,ro,ru,zh",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(longitude|pituusaste|længde|längengrad|lengtegraad|laengengrad|longitudine|longitud|Долгота|經度|[^\\p{IsAlphabetic}]long[^\\p{IsAlphabetic} ]).*|.*[^\\p{IsAlphabetic}](lon|long)$|^(lon|lng|long)$|^(lon|long)[^\\p{IsAlphabetic} ].*", "confidence": 99, "mandatory": true } ],
"matchEntries": [
{
"regExpsToMatch": [ "\\d*\\.?\\d+", "[+-]?\\d*\\.?\\d+" ],
"regExpReturned": "([+-]?([0-9]|[0-9][0-9]|1[0-7][0-9])\\.\\d+)|[+-]?180\\.0+",
"isRegExpComplete": true
},
{
"regExpsToMatch": [ "\\d*,?\\d+", "[+-]?\\d*,?\\d+" ],
"regExpReturned": "([+-]?([0-9]|[0-9][0-9]|1[0-7][0-9]),\\d+)|[+-]?180,0+",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Longitude" },
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Q36477" },
{ "source": "schema", "reference": "https://schema.org/longitude" }
],
"threshold": 98,
"baseType": "DOUBLE",
"minimum": "-180.0",
"maximum": "180.0",
"priority": 191
},
{
"semanticType": "COORDINATE.LATITUDE_DMS",
"description": "Latitude (degrees/minutes/seconds)",
"pluginType": "java",
"signature": "DbzARuk/thlR/jm3sj8H3vllZCE=",
"clazz": "com.cobber.fta.plugins.LatitudeDMS",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(latitude|[^\\p{IsAlphabetic}]lat[^\\p{IsAlphabetic}]).*|(?i)(lat)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Latitude" },
{ "source": "schema", "reference": "https://schema.org/latitude" }
],
"threshold": 99,
"priority": 192
},
{
"semanticType": "COORDINATE.LONGITUDE_DMS",
"description": "Longitude (degrees/minutes/seconds)",
"pluginType": "java",
"signature": "uZncg/K2y6hbc3Wul8IFlpvwEEU=",
"clazz": "com.cobber.fta.plugins.LongitudeDMS",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(longitude|[^\\p{IsAlphabetic}]long[^\\p{IsAlphabetic}]).*|lon|lng", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Longitude" },
{ "source": "schema", "reference": "https://schema.org/longitude" }
],
"threshold": 99,
"priority": 193
},
{
"semanticType": "COORDINATE.EASTING",
"description": "Latitude - easting",
"pluginType": "regex",
"signature": "EMjCy1d/N2KNGU3JR8XeZGAcIW0=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(easting).*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\d+",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Projected_coordinate_system" },
{ "source": "schema", "reference": "https://schema.org/latitude" }
],
"threshold": 98,
"baseType": "LONG",
"minimum": "0",
"priority": 194
},
{
"semanticType": "COORDINATE.NORTHING",
"description": "Longitude - northing",
"pluginType": "regex",
"signature": "RWgxHqDcPc9KKgzBF03YcFjzwIA=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(northing).*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\d+",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Projected_coordinate_system" },
{ "source": "schema", "reference": "https://schema.org/longitude" }
],
"threshold": 98,
"baseType": "LONG",
"minimum": "0",
"priority": 195
},
{
"semanticType": "COORDINATE_PAIR.DECIMAL",
"description": "Coordinate Pair Lat,Long - Decimal degrees",
"pluginType": "regex",
"signature": "6lVqkPqRAcyOlhHO3ckHttlzBww=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(loc|lat.*lon|lon.*lat|coord|position|geo|ubicación|koord|lokasi|posizione|Координаты|координати).*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpsToMatch": [ "[+-]?\\d+\\.\\d+,[+-]?\\d+\\.\\d+", "[+-]?\\d+\\.\\d+, [+-]?\\d+\\.\\d+", "([+-]?\\d*\\.\\d+, [+-]?\\d*\\.\\d+)" ],
"regExpReturned": "([+-]?([0-9]|[0-8][0-9])\\.\\d+|[+-]90\\.0+), ?([+-]?([0-9]|[0-9][0-9]|1[0-7][0-9])\\.\\d+|[+-]180\\.0+)",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" }
],
"threshold": 98,
"baseType": "STRING",
"priority": 196
},
{
"semanticType": "COORDINATE_PAIR.DECIMAL_PAREN",
"description": "Coordinate Pair (Lat,Long) - Decimal degrees)",
"pluginType": "regex",
"signature": "JjuOgDiwZkSPUB8AQMBLHAM1HFs=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(loc|lat.*lon|lon.*lat|coord|position|geo|ubicación|koord|lokasi|posizione|Координаты|координати).*", "confidence": 95 } ],
"matchEntries": [ {
"regExpsToMatch": [ "\\([+-]?\\d+\\.\\d+,[+-]?\\d+\\.\\d+\\)", "\\([+-]?\\d+\\.\\d+, [+-]?\\d+\\.\\d+\\)", "\\(([+-]?\\d*\\.\\d+, [+-]?\\d*\\.\\d+)\\)" ],
"regExpReturned": "\\(([+-]?([0-9]|[0-8][0-9])\\.\\d+|[+-]90\\.0+), ?([+-]?([0-9]|[0-9][0-9]|1[0-7][0-9])\\.\\d+|[+-]180\\.0+)\\)",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Geographic_coordinate_system" }
],
"threshold": 99,
"baseType": "STRING",
"priority": 197
},
{
"semanticType": "CITY",
"description": "City/Town",
"pluginType": "java",
"signature": "mz6raYadjSZxxvo+j66/fQXbhf8=",
"clazz": "com.cobber.fta.plugins.City",
"validLocales": [
{
"localeTag": "de",
"headerRegExps": [ { "regExp": "^(?i)(ort)$", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "en",
"headerRegExps": [
{ "regExp": "^(?i).*(ethnicity).*", "confidence": -1, "mandatory": true },
{ "regExp": "^(?i)(city|town)$", "confidence": 99, "mandatory": true },
{ "regExp": "^(?i).*[ _](city|town)$|^(city|town)[ _]name$|(?-i).*[a-z](City|Town)$", "confidence": 95, "mandatory": true },
{ "regExp": "^(?i).*(city|town)$", "confidence": 75, "mandatory": true }
]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": "^(?i)(ciudad)$", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "fr",
"headerRegExps": [ { "regExp": "^(?i)(ville)$", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": "^(?i)(plaats|woonplaats|woonplaatsnaam|wijk|wijknaam|buurt|buurtnaam)$", "confidence": 99, "mandatory": true } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_city_samples.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/City" },
{ "source": "schema", "reference": "https://schema.org/City" }
],
"baseType": "STRING",
"priority": 210
},
{
"semanticType": "CREDIT_CARD_TYPE",
"description": "Type of Credit CARD - e.g. AMEX, VISA, ...",
"pluginType": "list",
"signature": "QzgdMpiIKP3sFI8FS6u3taAuRK4=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(credit|card).*", "confidence": 90 }, { "regExp": ".*(?i)(credit|card).*", "confidence": 70 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/CCType.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Credit_card" },
{ "source": "schema", "reference": "https://schema.org/CreditCard" }
],
"backout": "[ \\p{Alpha}]+",
"priority": 220
},
{
"semanticType": "SSN",
"description": "Social Security Number (US)",
"pluginType": "java",
"signature": "SaJgghJaa44guUQ5oMO6woNkWac=",
"clazz": "com.cobber.fta.plugins.identity.SSN_US",
"validLocales": [
{
"localeTag": "en-US",
"headerRegExps": [ { "regExp": ".*(?i)(SSN).*", "confidence": 90 }, { "regExp": ".*(?i)(Social).*", "confidence": 70 } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Social_Security_number" }
],
"threshold": 98,
"priority": 225
},
{
"semanticType": "IDENTITY.EIN_US",
"description": "Employer Identification Number (US)",
"pluginType": "java",
"signature": "XwD3tlpcRPsH1AXfYE5z7XPvrjA=",
"clazz": "com.cobber.fta.plugins.identity.EIN",
"validLocales": [
{
"localeTag": "en-US",
"headerRegExps": [ { "regExp": ".*(?i)(EIN).*", "confidence": 95 }, { "regExp": ".*(?i)(Tax|Employer).*", "confidence": 70 } ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P1297" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Employer_Identification_Number" }
],
"threshold": 98,
"baseType": "STRING",
"priority": 226
},
{
"semanticType": "IDENTITY.PERSONNUMMER_SE",
"description": "Personal identity number (Sweden)",
"pluginType": "java",
"signature": "lBrcRccn22VRzUfFCmzK2pGDehE=",
"clazz": "com.cobber.fta.plugins.identity.Personnummer_SE",
"validLocales": [
{ "localeTag": "sv-SE", "headerRegExps": [ { "regExp": ".*(?i)(personnummer)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Personal_identity_number_(Sweden)" }
],
"threshold": 98,
"priority": 230
},
{
"semanticType": "IDENTITY.SSN_FR",
"description": "Social Security Number (France)",
"pluginType": "java",
"signature": "XfMSrETk0IIuromCYEfRy+k212s=",
"clazz": "com.cobber.fta.plugins.identity.SSN_FR",
"validLocales": [
{ "localeTag": "fr-FR", "headerRegExps": [ { "regExp": ".*(?i)(SSN)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P374" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/INSEE_code" }
],
"threshold": 98,
"priority": 231
},
{
"semanticType": "IDENTITY.INDIVIDUAL_NUMBER_JA",
"description": "Individual Number / My Number (Japan)",
"pluginType": "java",
"signature": "E4/GpH4/SwmWNCLlNswUgL6qWBU=",
"clazz": "com.cobber.fta.plugins.identity.IN_JA",
"validLocales": [
{ "localeTag": "ja", "headerRegExps": [ { "regExp": ".*(?i)(Individual Number|My Number|個人番号|マイナンバー|kojin bangō|mai nambā)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Individual_Number" }
],
"threshold": 98,
"priority": 232
},
{
"semanticType": "IDENTITY.SSN_CH",
"description": "AVH Number / SSN (Switzerland)",
"pluginType": "java",
"signature": "JuS68p5mp6n2dvAxNDEuS7S4f9U=",
"clazz": "com.cobber.fta.plugins.identity.SSN_CH",
"validLocales": [
{ "localeTag": "de-CH,fr-CH,it-CH", "headerRegExps": [ { "regExp": ".*(?i)(AVH|SSN|Sozialversicherungsnummer)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/National_identification_number#Switzerland" }
],
"threshold": 98,
"priority": 233
},
{
"semanticType": "IDENTITY.AADHAAR_IN",
"description": "Aadhaar (India)",
"pluginType": "java",
"signature": "X+ml1qaeW0taw3RfNRky+4Ifg88=",
"clazz": "com.cobber.fta.plugins.identity.Aadhaar_IN",
"validLocales": [
{ "localeTag": "en-IN", "headerRegExps": [ { "regExp": ".*(?i)(Aadhar|Aadhaar)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Aadhaar" }
],
"threshold": 98,
"priority": 234
},
{
"semanticType": "IDENTITY.BSN_NL",
"description": "BSN (Netherlands)",
"pluginType": "java",
"signature": "7Q98Lrd+aZrOHv6KdG81YGOV4fk=",
"clazz": "com.cobber.fta.plugins.identity.BSN_NL",
"validLocales": [
{ "localeTag": "en-NL,nl-NL", "headerRegExps": [ { "regExp": ".*(?i)(BSN)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/National_identification_number#Netherlands" }
],
"threshold": 98,
"priority": 235
},
{
"semanticType": "IDENTITY.NHS_UK",
"description": "NHS (UK)",
"pluginType": "java",
"signature": "CftIkR8ZKJb0EsTdGaP4WzBW4/c=",
"clazz": "com.cobber.fta.plugins.identity.NHS_UK",
"validLocales": [
{ "localeTag": "en-GB,en-UK", "headerRegExps": [ { "regExp": ".*(?i)(NHS)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/NHS_number" }
],
"threshold": 98,
"priority": 236
},
{
"semanticType": "IDENTITY.NI_UK",
"description": "National Insurance Number (UK)",
"pluginType": "java",
"signature": "Q+g0UIYDCi5HMGM64y1jNs9LBdw=",
"clazz": "com.cobber.fta.plugins.identity.NI_UK",
"validLocales": [
{ "localeTag": "en-GB,en-UK", "headerRegExps": [ { "regExp": "(?i)(NI|NINO|.*National.?Insurance.*)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/National_Insurance_number" }
],
"threshold": 98,
"priority": 237
},
{
"semanticType": "IDENTITY.NPI_US",
"description": "National Provider Identifier (US)",
"pluginType": "java",
"signature": "x+p/BP9gCPuonINo01fu324kuvE=",
"clazz": "com.cobber.fta.plugins.identity.NPI_US",
"validLocales": [
{ "localeTag": "en-US", "headerRegExps": [ { "regExp": "(?i)(NPI|national.?provider.?identifier)", "confidence": 95 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/National_Provider_Identifier" }
],
"baseType": "LONG",
"priority": 238
},
{
"semanticType": "IDENTITY.DUNS",
"description": "Data Universal Numbering System (Dun & Bradstreet)",
"pluginType": "regex",
"signature": "DMFnAAIxAV3SYWq07h/9U2S8IVo=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(DUNS|D-U-N-S).*", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\d{9}",
"isRegExpComplete": false
} ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P2771" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Data_Universal_Numbering_System" },
{ "source": "schema", "reference": "https://schema.org/duns" }
],
"baseType": "LONG",
"priority": 239
},
{
"semanticType": "IDENTITY.VAT_",
"description": "VAT",
"pluginType": "java",
"signature": "[NONE]",
"clazz": "com.cobber.fta.plugins.identity.VAT",
"validLocales": [
{ "localeTag": "en-GB,en-UK", "headerRegExps": [ { "regExp": ".*(?i)(VAT).*", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "it-IT", "headerRegExps": [ { "regExp": ".*(?i)(IVA).*", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "es-ES,ca-ES", "headerRegExps": [ { "regExp": ".*(?i)(NIF|CIF).*", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "en-NL,nl-NL", "headerRegExps": [ { "regExp": ".*(?i)(BTW).*", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "pl-PL", "headerRegExps": [ { "regExp": ".*(?i)(NIP).*", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "de-AT", "headerRegExps": [ { "regExp": "(?i)(UID)", "confidence": 95, "mandatory": true } ] },
{ "localeTag": "fr-FR", "headerRegExps": [ { "regExp": "(?i)(TVA)", "confidence": 95, "mandatory": true } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P3608" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Value-added_tax" }
],
"threshold": 95,
"priority": 240
},
{
"semanticType": "LANGUAGE.ISO-639-2",
"description": "Language code - ISO 639, three character",
"pluginType": "list",
"signature": "oh7DsTF4qDUm+o+JPy7jAIoU+1Y=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(language|lingua|639|3066).*", "confidence": 90 }, { "regExp": ".*(?i)(lang).*", "confidence": 60 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ISO-639-2.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P219" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISO_639-2" }
],
"backout": "\\p{IsAlphabetic}{2}",
"priority": 245
},
{
"semanticType": "LANGUAGE.ISO-639-1",
"description": "Language code - ISO 639, two character",
"pluginType": "list",
"signature": "5f6VjpTf8QQ4BjI0GVI1e7z9o3U=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(language|lingua|639|3066).*", "confidence": 90 }, { "regExp": ".*(?i)(lang).*", "confidence": 60 } ] }
],
"content": {
"type": "resource",
"reference": "/reference/ISO-639-1.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P218" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISO_639-1" }
],
"backout": "\\p{IsAlphabetic}{3}",
"priority": 246
},
{
"semanticType": "LANGUAGE.TEXT_EN",
"description": "Language name, e.g. English, French, ...",
"pluginType": "list",
"pluginOptions": "words=all",
"signature": "XCjtEvkiEs1eLR9wqzgkxxgosg0=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(language).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "[-' \\p{IsAlphabetic}]+"
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_language.csv"
},
"backout": "[\\p{Alpha}]+",
"priority": 250
},
{
"semanticType": "MACADDRESS",
"description": "MAC Address",
"pluginType": "regex",
"signature": "QIZNObx4ycNBImDb7esJCP1YrOs=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(MAC).*", "confidence": 90 } ],
"matchEntries": [
{
"regExpsToMatch": [ "\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}" ],
"regExpReturned": "\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}:\\p{XDigit}{2}",
"isRegExpComplete": true
},
{
"regExpsToMatch": [ "\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}" ],
"regExpReturned": "\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}-\\p{XDigit}{2}",
"isRegExpComplete": true
}
]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/MAC_address" }
],
"threshold": 98,
"baseType": "STRING",
"priority": 260
},
{
"semanticType": "MONTH.DIGITS",
"description": "Numeric Month",
"pluginType": "java",
"signature": "dFlMU1F4av5mccH3zIeKaRe67SY=",
"clazz": "com.cobber.fta.plugins.MonthDigits",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(month|month.?number)|(i?)(month|month.?number).*", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": ".*(?i)(mes)|(i?)(mes).*", "confidence": 99, "mandatory": true } ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": ".*(?i)(maand)|(i?)(maand).*", "confidence": 99, "mandatory": true } ]
}
],
"threshold": 98,
"baseType": "LONG",
"priority": 270
},
{
"semanticType": "DAY.DIGITS",
"description": "Numeric Day of Month",
"pluginType": "java",
"signature": "1C6IAjixbGXDfrkL4dEndXg65BQ=",
"clazz": "com.cobber.fta.plugins.DayDigits",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [
{ "regExp": "(?i)day", "confidence": 99, "mandatory": true },
{ "regExp": ".*(?i)(day|cycle).*", "confidence": 90, "mandatory": true }
]
},
{
"localeTag": "es",
"headerRegExps": [
{ "regExp": "(?i)(?u)(día|dia[_ ].*)", "confidence": 99, "mandatory": true }
]
},
{
"localeTag": "nl",
"headerRegExps": [
{ "regExp": "(?i)dag", "confidence": 99, "mandatory": true }
]
}
],
"threshold": 98,
"baseType": "LONG",
"priority": 271
},
{
"semanticType": "EPOCH.SECONDS",
"description": "Unix Epoch (Timestamp) - seconds",
"pluginType": "java",
"signature": "SDOVIb658Bu1vG5h1htbJj0PMqg=",
"clazz": "com.cobber.fta.plugins.EpochSeconds",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [
{ "regExp": ".*(?i)(timestamp|_ts).*", "confidence": 99, "mandatory": true },
{ "regExp": ".*(?i)(time|date).*", "confidence": 85, "mandatory": true }
],
"matchEntries": [ {
"regExpReturned": "\\d{10}",
"isRegExpComplete": false
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Unix_time" }
],
"threshold": 99,
"baseType": "LONG",
"priority": 272
},
{
"semanticType": "EPOCH.MILLISECONDS",
"description": "Unix Epoch (Timestamp) - milliseconds",
"pluginType": "java",
"signature": "viRZbKzQgIqtkppDhoCbAFLXEag=",
"clazz": "com.cobber.fta.plugins.EpochMilliseconds",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [
{ "regExp": ".*(?i)(timestamp|_ts).*", "confidence": 99, "mandatory": true },
{ "regExp": ".*(?i)(time|date).*", "confidence": 85, "mandatory": true }
],
"matchEntries": [ {
"regExpReturned": "\\d{13}",
"isRegExpComplete": false
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Unix_time" }
],
"threshold": 99,
"baseType": "LONG",
"priority": 273
},
{
"semanticType": "IMEI",
"description": "International Mobile Equipment Identity",
"pluginType": "java",
"signature": "QPHqJewHLBbpUTGQg7hc1+Zzu/g=",
"clazz": "com.cobber.fta.plugins.IMEI",
"validLocales": [ { "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(imei).*", "confidence": 99, "mandatory": true } ] } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/International_Mobile_Equipment_Identity" }
],
"baseType": "LONG",
"priority": 289
},
{
"semanticType": "CHECKDIGIT.LUHN",
"description": "LUHN Checkdigit (Credit Cards, IMEI, etc)",
"pluginType": "java",
"signature": "ySEbGrpJCO/yoMiVxyK5vi9sBtU=",
"clazz": "com.cobber.fta.plugins.CheckDigitLuhn",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Luhn_algorithm" }
],
"baseType": "LONG",
"priority": 290
},
{
"semanticType": "CHECKDIGIT.CUSIP",
"description": "CUSIP - North American Security Identifiers",
"pluginType": "java",
"signature": "4EK6Y3hBd2en5Hm9EUKnVbrUjlM=",
"clazz": "com.cobber.fta.plugins.CheckDigitCUSIP",
"validLocales": [
{
"localeTag": "*",
"matchEntries": [ {
"regExpReturned": "[\\p{IsAlphabetic}\\d]{9}"
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/CUSIP" }
],
"priority": 291
},
{
"semanticType": "CHECKDIGIT.SEDOL",
"description": "SEDOL - UK Security Identifiers",
"pluginType": "java",
"signature": "A6zVzMb8GxHKIRvQeHJYY2mUqV0=",
"clazz": "com.cobber.fta.plugins.CheckDigitSEDOL",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/SEDOL" }
],
"priority": 292
},
{
"semanticType": "CHECKDIGIT.ISIN",
"description": "ISIN - International Securities Identification Number",
"pluginType": "java",
"signature": "ROIyMHsrinw2O/REk9ClAb0WUEs=",
"clazz": "com.cobber.fta.plugins.CheckDigitISIN",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P946" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/International_Securities_Identification_Number" }
],
"priority": 293
},
{
"semanticType": "CHECKDIGIT.EAN13",
"description": "EAN-13 - EAN-13/ISBN-13 Check digit",
"pluginType": "java",
"signature": "AP6Bjl97rR4D1ogsqPqXGoD5Dq4=",
"clazz": "com.cobber.fta.plugins.CheckDigitEAN13",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P212" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISBN" },
{ "source": "schema", "reference": "https://schema.org/gtin13" }
],
"baseType": "LONG",
"priority": 294
},
{
"semanticType": "CHECKDIGIT.UPC",
"description": "UPC - Universal Product Code",
"pluginType": "java",
"signature": "L88o6zYDCyR84UYMe+O/ua0Kfcg=",
"clazz": "com.cobber.fta.plugins.CheckDigitUPC",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Universal_Product_Code" }
],
"baseType": "LONG",
"priority": 295
},
{
"semanticType": "CHECKDIGIT.IBAN",
"description": "IBAN - International Bank Account Number",
"pluginType": "java",
"signature": "ahEtumk3vTi+ErbmmqrmBN7OeVU=",
"clazz": "com.cobber.fta.plugins.CheckDigitIBAN",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/International_Bank_Account_Number" }
],
"priority": 296
},
{
"semanticType": "CHECKDIGIT.ABA",
"description": "ABA Number (or Routing Transit Number (RTN))",
"pluginType": "java",
"signature": "z/uWdWQDM6Ln80wNSIshhGV5et4=",
"clazz": "com.cobber.fta.plugins.CheckDigitABA",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ABA_routing_transit_number" }
],
"baseType": "LONG",
"priority": 297
},
{
"semanticType": "CHECKDIGIT.ISBN",
"description": "ISBN-13 identifiers (with hyphens)",
"pluginType": "java",
"signature": "4ZyGddBdufT5msMx8IyO5ZJP30s=",
"clazz": "com.cobber.fta.plugins.CheckDigitISBN",
"validLocales": [ { "localeTag": "*" } ],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/ISBN" },
{ "source": "schema", "reference": "https://schema.org/isbn" }
],
"priority": 298
},
{
"semanticType": "JOB_TITLE_EN",
"description": "Job Title/Occupation (English Language)",
"pluginType": "java",
"signature": "6IKfzTa++cfQDm7aehEqSaJ/rek=",
"clazz": "com.cobber.fta.plugins.JobTitleEN",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(job.title).*", "confidence": 99 }, { "regExp": ".*(?i)(title|position|occupation|profession|role).*", "confidence": 90 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Work_(human_activity)" },
{ "source": "schema", "reference": "https://schema.org/jobTitle" },
{ "source": "schema", "reference": "https://schema.org/title" }
],
"threshold": 60,
"priority": 300
},
{
"semanticType": "INDUSTRY_EN",
"description": "Industry Name",
"pluginType": "java",
"signature": "j2TOVT5j9M0DIQyTrwOdB71iZdA=",
"clazz": "com.cobber.fta.plugins.IndustryEN",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": "(?i)(industry)", "confidence": 99, "mandatory": true }, { "regExp": ".*(?i)(industry|naics).*", "confidence": 90, "mandatory": true } ] }
],
"priority": 301
},
{
"semanticType": "HASH.SHA1_HEX",
"description": "SHA1 Hash - hexadecimal",
"pluginType": "regex",
"signature": "N4sH+cysuswY590FSnqXWIn0e3k=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(SHA1|hash).*", "confidence": 99 } ],
"matchEntries": [ {
"regExpReturned": "\\p{XDigit}{40}",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/SHA-1" }
],
"threshold": 99,
"baseType": "STRING",
"priority": 302
},
{
"semanticType": "HASH.SHA256_HEX",
"description": "SHA256 Hash - hexadecimal",
"pluginType": "regex",
"signature": "D+loPv6WvUlbi28kW3z7tVJ40N4=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(SHA256|hash).*", "confidence": 99 } ],
"matchEntries": [ {
"regExpReturned": "\\p{XDigit}{64}",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/SHA-2" }
],
"threshold": 99,
"baseType": "STRING",
"priority": 303
},
{
"semanticType": "COLOR.HEX",
"description": "Hex Color code",
"pluginType": "regex",
"signature": "HX3ks449m2szm58Mj0TNb+W8e0A=",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": ".*(?i)(color|colour).*", "confidence": 90 } ],
"matchEntries": [ {
"regExpReturned": "#\\p{XDigit}{6}",
"isRegExpComplete": true
} ]
}
],
"threshold": 99,
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P465" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Web_colors" },
{ "source": "schema", "reference": "https://schema.org/color" }
],
"baseType": "STRING",
"priority": 304
},
{
"semanticType": "COLOR.TEXT_EN",
"description": "Color name (English)",
"pluginType": "list",
"pluginOptions": "words=all",
"signature": "CIsljBWEmutE4EulPJgCkQZyzMU=",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(color|colour).*", "confidence": 90 } ] }
],
"ignoreList": [ "N/A", "OTHER" ],
"content": {
"type": "resource",
"reference": "/reference/en_color.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P462" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Web_colors" },
{ "source": "schema", "reference": "https://schema.org/color" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 305
},
{
"semanticType": "COLOR.TEXT_NL",
"description": "Color name (Dutch)",
"pluginType": "list",
"pluginOptions": "words=all",
"signature": "+WrxpZvBxXNUyWInyd9r2FadhuY=",
"validLocales": [
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(kleur).*", "confidence": 90, "mandatory": true } ] }
],
"ignoreList": [ "NVT" ],
"content": {
"type": "resource",
"reference": "/reference/nl_color.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P462" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Web_colors" },
{ "source": "schema", "reference": "https://schema.org/color" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 306
},
{
"semanticType": "COLOR.TEXT_ES",
"description": "Color name (Spanish)",
"pluginType": "list",
"pluginOptions": "words=all",
"signature": "I2y3yXfuj8RTGMSr6exv3TnPWoE=",
"validLocales": [
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(color).*", "confidence": 90, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/es_color.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P462" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Web_colors" },
{ "source": "schema", "reference": "https://schema.org/color" }
],
"backout": "[ \\p{IsAlphabetic}]+",
"priority": 306
},
{
"semanticType": "DIRECTION",
"description": "Cardinal Direction",
"pluginType": "java",
"signature": "eQbFEkaZaWJM4Quexoibt1QJsnw=",
"clazz": "com.cobber.fta.plugins.Direction",
"validLocales": [
{ "localeTag": "*", "headerRegExps": [ { "regExp": ".*(?i)(direction).*", "confidence": 99 },
{ "regExp": ".*(?i)(dir|suffix|prefix).*", "confidence": 90 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Cardinal_direction" }
],
"baseType": "STRING",
"priority": 310
},
{
"semanticType": "INDUSTRY_CODE.NAICS",
"description": "Industry Code - NAICS",
"pluginType": "java",
"signature": "i2DkepwVwjhGYOf7BbaemLrr1GI=",
"clazz": "com.cobber.fta.plugins.IndustryNAICS",
"validLocales": [
{ "localeTag": "en-US,en-CA,en-MX,es-MX,fr-CA", "headerRegExps": [ { "regExp": ".*(?i)(naics.?code).*", "confidence": 99, "mandatory": true }, { "regExp": ".*(?i)(naics).*", "confidence": 90, "mandatory": true } ] }
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P3224" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/North_American_Industry_Classification_System" },
{ "source": "schema", "reference": "https://schema.org/naics" }
],
"baseType": "LONG",
"priority": 311
},
{
"semanticType": "NAME.LAST_FIRST",
"description": "Merged Name (Last, First)",
"pluginType": "java",
"signature": "WlXF9TSnYBDQXbOMhceVK9XCxAk=",
"clazz": "com.cobber.fta.plugins.NameLastFirst",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(name|contact|author).*", "confidence": 60 } ] },
{ "localeTag": "de", "headerRegExps": [ { "regExp": ".*(?i)(name).*", "confidence": 60 } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(nombre).*", "confidence": 60 } ] },
{ "localeTag": "fr", "headerRegExps": [ { "regExp": ".*(?i)(nom).*", "confidence": 60 } ] },
{ "localeTag": "it", "headerRegExps": [ { "regExp": ".*(?i)(nome).*", "confidence": 60 } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(naam).*", "confidence": 60 } ] },
{ "localeTag": "pt", "headerRegExps": [ { "regExp": ".*(?i)(nome).*", "confidence": 60 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Personal_name" }
],
"threshold": 90,
"priority": 370
},
{
"semanticType": "NAME.FIRST_LAST",
"description": "Merged Name (First Last)",
"pluginType": "java",
"signature": "pJJS+kSfyNDRb2T7SXIWhZhlH3c=",
"clazz": "com.cobber.fta.plugins.NameFirstLast",
"validLocales": [
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(name|contact|author).*", "confidence": 60 } ] },
{ "localeTag": "de", "headerRegExps": [ { "regExp": ".*(?i)(name).*", "confidence": 60 } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(nombre).*", "confidence": 60 } ] },
{ "localeTag": "fr", "headerRegExps": [ { "regExp": ".*(?i)(nom).*", "confidence": 60 } ] },
{ "localeTag": "it", "headerRegExps": [ { "regExp": ".*(?i)(nome).*", "confidence": 60 } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(naam).*", "confidence": 60 } ] },
{ "localeTag": "pt", "headerRegExps": [ { "regExp": ".*(?i)(nome).*", "confidence": 60 } ] }
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Personal_name" }
],
"priority": 371
},
{
"semanticType": "NAME.FIRST",
"description": "First Name",
"pluginType": "java",
"signature": "slggsAEDZ26rz9dqs15eNF23j2w=",
"clazz": "com.cobber.fta.plugins.FirstName",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(first.?name|fname|given.?name|forename|first_nm).*", "confidence": 95 },
{ "regExp": "(?i)(name|.*first.*|.*given.*)", "confidence": 60 }, { "regExp": "(?i).*city.*", "confidence": -100 } ],
"matchEntries": [ {
"regExpReturned": "[\\p{IsAlphabetic}]+[- \\p{IsAlphabetic}]*\\.?"
} ]
},
{
"localeTag": "de",
"headerRegExps": [ { "regExp": ".*(?i)(vornam).*", "confidence": 90 },
{ "regExp": "(?i)(first)", "confidence": 90 }, { "regExp": "(?i)(name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": ".*(?i)(nombre).*", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "fr",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(prénom|prenom).*", "confidence": 90 },
{ "regExp": "(?i)(first)", "confidence": 90 }, { "regExp": "(?i)(nom|name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "it",
"headerRegExps": [ { "regExp": ".*(?i)(nome).*", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": ".*(?i)(voornaam|vnaam).*", "confidence": 90 }, { "regExp": "(?i)(naam|name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "pt",
"headerRegExps": [ { "regExp": "(?i)(nome)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P735" },
{ "source": "schema", "reference": "https://schema.org/givenName" }
],
"priority": 372
},
{
"semanticType": "NAME.LAST",
"description": "Last Name",
"pluginType": "java",
"signature": "+h9v4tygGZxbEPbJLp5MDezGgME=",
"clazz": "com.cobber.fta.plugins.LastName",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(surname|last.?name|lname|maiden.?name|name.?last|last_nm).*|last", "confidence": 90 },
{ "regExp": "(?i)(name|.*last.*)", "confidence": 60 }, { "regExp": "(?i).*city.*", "confidence": -100 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "de",
"headerRegExps": [ { "regExp": ".*(?i)(nachname).*", "confidence": 90 }, { "regExp": "(?i)(name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "el",
"headerRegExps": [ { "regExp": ".*(?i)(?u)(ΠΑΤΡΩΝΥΜΟ).*", "confidence": 90 }, { "regExp": "(?i)(?u)(ΟΝΟΜΑ)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "es",
"headerRegExps": [ { "regExp": ".*(?i)(apellido).*", "confidence": 90 }, { "regExp": ".*(?i)(nombre).*", "confidence": 60 },
{ "regExp": "(?i).*ciudad.*", "confidence": -100 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "fr",
"headerRegExps": [ { "regExp": "(?i)(nom|name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "it",
"headerRegExps": [ { "regExp": ".*(?i)(cognome).*", "confidence": 90 }, { "regExp": "(?i)(nome)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "nl",
"headerRegExps": [ { "regExp": ".*(?i)(achternaam|anaam).*", "confidence": 90 }, { "regExp": "(?i)(naam|name)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
},
{
"localeTag": "pt",
"headerRegExps": [ { "regExp": ".*(?i)(sobrenome).*", "confidence": 90 }, { "regExp": "(?i)(nome)", "confidence": 60 } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
}
],
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P734" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Surname" },
{ "source": "schema", "reference": "https://schema.org/familyName" }
],
"priority": 373
},
{
"semanticType": "NAME.MIDDLE",
"description": "Middle Name",
"pluginType": "java",
"signature": "3UGho+Z93uiqi9L8+qjAQ1pb0qQ=",
"clazz": "com.cobber.fta.plugins.MiddleName",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": ".*(?i)(middle.?name).*|(?i)(mi|middle)", "confidence": 99, "mandatory": true } ],
"matchEntries": [ {
"regExpReturned": "\\p{IsAlphabetic}[- \\p{IsAlphabetic}]*"
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Middle_name" },
{ "source": "schema", "reference": "https://schema.org/additionalName" }
],
"priority": 374
},
{
"semanticType": "NAME.MIDDLE_INITIAL",
"description": "Middle Initial",
"pluginType": "regex",
"signature": "5AG+x37vekPMlggzCTebzFWovPc=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [
{ "regExp": ".*(?i)(middle.?init).*|(?i)(mi|middle)", "confidence": 99, "mandatory": true },
{ "regExp": "(?i)middle.*", "confidence": 90, "mandatory": true }
],
"matchEntries": [ {
"regExpsToMatch": [ "\\p{IsAlphabetic}", "\\p{IsAlphabetic}\\." ],
"regExpReturned": "\\p{IsAlphabetic}\\.?",
"isRegExpComplete": true
} ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Middle_name" }
],
"threshold": 98,
"baseType": "STRING",
"priority": 375
},
{
"semanticType": "NAME.SUFFIX",
"description": "Name Suffix",
"pluginType": "list",
"signature": "O8pdYhB+VqM6qvj6Yc7Wt3JPhy0=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [ { "regExp": "(?i)(suffix|suff|.*[_ ]suffix)", "confidence": 99, "mandatory": true }, { "regExp": "(?i).*suffix", "confidence": 85, "mandatory": true } ]
}
],
"content": {
"type": "resource",
"reference": "/reference/en_name_suffix.csv"
},
"documentation": [
{ "source": "wikidata", "reference": "https://www.wikidata.org/wiki/Property:P8017" },
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Suffix_(name)" }
],
"backout": "[ \\p{IsAlphabetic}.]+",
"threshold": 90,
"baseType": "STRING",
"priority": 376
},
{
"semanticType": "COMPANY_NAME",
"description": "Organization/Company Name",
"pluginType": "regex",
"signature": "gTynrjgOpvdzfWdVMRddP2Ksv8k=",
"validLocales": [
{
"localeTag": "en",
"headerRegExps": [
{ "regExp": "^(?i)(company|business|dba|organization|company.?name|business.?name|dba.?name|organization.?name|org.?name|vendor.?name)$", "confidence": 99, "mandatory": true },
{ "regExp": "^.*(?i)(company.?name|business.?name|organization.?name|dba.?name).*$", "confidence": 90, "mandatory": true }
],
"matchEntries": [ {
"regExpsToMatch": [ ".+", "\\p{IsAlphabetic}+" ],
"regExpReturned": "[-+|*:;!@\"/()', \\.\\p{IsAlphabetic}\\d]*",
"isRegExpComplete": false
} ]
},
{
"localeTag": "nl",
"headerRegExps": [
{ "regExp": "^(?i)(Handelsnaam|naam.?organisatie|organisatie)$", "confidence": 99, "mandatory": true }
],
"matchEntries": [ {
"regExpsToMatch": [ ".+", "\\p{IsAlphabetic}+" ],
"regExpReturned": "[-+|*:;!@\"/()', \\.\\p{IsAlphabetic}\\d]*",
"isRegExpComplete": false
} ]
}
],
"content": {
"type": "resource",
"reference": "/reference/us_companies_samples.csv"
},
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Company" },
{ "source": "schema", "reference": "https://schema.org/Corporation" }
],
"baseType": "STRING",
"priority": 380
},
{
"semanticType": "FREE_TEXT",
"description": "Free Text field - e.g. Description, Notes, Comments, ...",
"pluginType": "java",
"signature": "7WbjWLZJ8Zdm+U8po/igrvDH3yE=",
"clazz": "com.cobber.fta.plugins.FreeText",
"validLocales": [
{ "localeTag": "bg", "headerRegExps": [ { "regExp": ".*(?i)(?u)(описание|Бележки|Забележки|коментар|причина|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ca", "headerRegExps": [ { "regExp": ".*(?i)(?u)(descripció|comentar|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "da", "headerRegExps": [ { "regExp": ".*(?i)(?u)(beskrivelse|noter|kommentar|årsag|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "de", "headerRegExps": [ { "regExp": ".*(?i)(bezeichnung|anmerkungen|bemerkungen|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "en", "headerRegExps": [ { "regExp": ".*(?i)(description|notes|comment|reason).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "es", "headerRegExps": [ { "regExp": ".*(?i)(?u)(descripción|nota|motivo).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "fi", "headerRegExps": [ { "regExp": ".*(?i)(kuvaus|huomautukset|kommentti|syy|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "fr", "headerRegExps": [ { "regExp": ".*(?i)(description|remarques|commentaire|raison).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ga", "headerRegExps": [ { "regExp": ".*(?i)(?u)(tuairisc|nótaí|trácht|fáth|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "hr", "headerRegExps": [ { "regExp": ".*(?i)(?u)(opis|napomene|komentar|razlog|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "hu", "headerRegExps": [ { "regExp": ".*(?i)(?u)(leírás|jegyzetek|megjegyzés|indoklás|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "it", "headerRegExps": [ { "regExp": ".*(?i)(descrizione|nota|Annotazioni|motivo|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "lv", "headerRegExps": [ { "regExp": ".*(?i)(?u)(apraksts|piezīmes|komentārs|iemesls|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "nl", "headerRegExps": [ { "regExp": ".*(?i)(omschrijving|opmerkingen|description).*|(?i)omsch.*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "pt", "headerRegExps": [ { "regExp": ".*(?i)(?u)(descrição|nota|motivo).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ro", "headerRegExps": [ { "regExp": ".*(?i)(descriere|note|comentar|motiv|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "ru", "headerRegExps": [ { "regExp": ".*(?i)(?u)(описание|description).*", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "sk", "headerRegExps": [ { "regExp": ".*(?i)(?u)(popis|poznámky|komentár|dôvod|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "sv", "headerRegExps": [ { "regExp": ".*(?i)(?u)(beskrivning|anteckningar|kommentar|orsak|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] },
{ "localeTag": "tr", "headerRegExps": [ { "regExp": ".*(?i)(?u)(açıklama|notlar|yorum|sebep|description).*|.*(?i)(desc)", "confidence": 99, "mandatory": true } ] }
],
"content": {
"type": "resource",
"reference": "/reference/_free_text_samples.csv"
},
"threshold": 70,
"baseType": "STRING",
"priority": 390
},
{
"semanticType": "IDENTIFIER",
"description": "Unique Identifier",
"pluginType": "java",
"signature": "RKNrRP3/trxIfbpsaz9soam8suY=",
"clazz": "com.cobber.fta.plugins.Identifier",
"validLocales": [
{
"localeTag": "*",
"headerRegExps": [ { "regExp": "(?i)(id|.*_id)", "confidence": 99 }, { "regExp": "(?i).*id", "confidence": 95 } ]
}
],
"documentation": [
{ "source": "wikipedia", "reference": "https://en.wikipedia.org/wiki/Identifier" },
{ "source": "schema", "reference": "https://schema.org/identifier" }
],
"priority": 400
}
]