用于主键统一的实体主数据对齐原子 Skill,适用于通用行业数据接入场景。
本 Skill 支持多种实体主数据输入格式,核心数据来源包括用户提供的源数据和主数据标准。
说明:本 Skill 不包含数据采集功能,需要用户提供源数据和主数据标准。建议主数据标准清晰明确,以便进行准确的实体对齐。
本 Skill 提供全面的实体主数据对齐能力,涵盖精确匹配(exact_match)、模糊匹配(fuzzy_match)等多种对齐功能。对齐结果的 JSON 示例如下:
{
"source_info": {
"source_data": "company_data.csv",
"source_format": "csv",
"entity_count": 1000
},
"master_data_standard": {
"standard_name": "company_master_data",
"primary_key": "company_code",
"key_fields": ["company_name", "unified_social_credit_code"]
},
"alignment_rules": [
{
"rule_id": "RULE001",
"rule_type": "exact_match",
"match_fields": ["company_name"],
"confidence_threshold": 1.0
},
{
"rule_id": "RULE002",
"rule_type": "fuzzy_match",
"match_fields": ["company_name"],
"confidence_threshold": 0.9
}
],
"alignment_results": {
"total_entities": 1000,
"aligned_entities": 950,
"unmatched_entities": 50,
"alignment_time": "2024-03-15T10:00:00",
"duration": "30s"
},
"aligned_entities": [
{
"source_entity": {
"source_id": "SRC001",
"company_name": "示例股份有限公司",
"source_key": "COMP001"
},
"master_entity": {
"master_id": "MAST001",
"company_code": "COMP001",
"company_name": "示例股份有限公司",
"unified_social_credit_code": "91110000123456789X"
},
"alignment_type": "exact_match",
"confidence": 1.0,
"match_fields": ["company_name"]
}
],
"statistics": {
"entities_aligned": 950,
"entities_unmatched": 50,
"exact_matches": 800,
"fuzzy_matches": 150,
"alignment_accuracy": 0.95
}
}