Files
data-ge/demo/水务/水务-qwen3-next-80b-ge-desc.json
2025-11-14 00:58:00 +08:00

1 line
8.4 KiB
JSON
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{"role": "dimension", "time": {"range": null, "column": null, "has_gaps": null, "granularity": "unknown"}, "grain": ["account_id", "service_point_id"], "table": "water_meter_info", "columns": [{"name": "supply_office", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "供应办公室,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.09090909090909093, "value": "宝山供水管理所"}, {"pct": 0.09090909090909093, "value": "黄浦供水管理所"}, {"pct": 0.09090909090909093, "value": "青东供水管理所"}, {"pct": 0.09090909090909093, "value": "虹口供水管理所"}, {"pct": 0.09090909090909093, "value": "闸北供水管理所"}, {"pct": 0.09090909090909093, "value": "松北供水管理所"}, {"pct": 0.09090909090909093, "value": "杨浦供水管理所"}, {"pct": 0.09090909090909093, "value": "长宁供水管理所"}, {"pct": 0.09090909090909093, "value": "闵行供水管理所"}, {"pct": 0.09090909090909093, "value": "徐汇供水管理所"}], "semantic_type": "dimension", "distinct_count": 11, "distinct_ratio": 0.03666666666666667, "pk_candidate_score": 0.1, "metric_candidate_score": 0.0}, {"name": "station", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "站点名称,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.027777777777777776, "value": "新闸站"}, {"pct": 0.027777777777777776, "value": "宝杨站"}, {"pct": 0.027777777777777776, "value": "江川站"}, {"pct": 0.027777777777777776, "value": "长江站"}, {"pct": 0.027777777777777776, "value": "市光站"}, {"pct": 0.027777777777777776, "value": "徐泾站"}, {"pct": 0.027777777777777776, "value": "真北站"}, {"pct": 0.027777777777777776, "value": "半淞园站"}, {"pct": 0.027777777777777776, "value": "芙蓉江站"}, {"pct": 0.027777777777777776, "value": "密云站"}], "semantic_type": "dimension", "distinct_count": 36, "distinct_ratio": 0.12, "pk_candidate_score": 0.12, "metric_candidate_score": 0.0}, {"name": "district", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": 
"行政区,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.07692307692307693, "value": "普陀区"}, {"pct": 0.07692307692307693, "value": "闵行区"}, {"pct": 0.07692307692307693, "value": "嘉定区"}, {"pct": 0.07692307692307693, "value": "杨浦区"}, {"pct": 0.07692307692307693, "value": "徐汇区"}, {"pct": 0.07692307692307693, "value": "黄浦区"}, {"pct": 0.07692307692307693, "value": "松江区"}, {"pct": 0.07692307692307693, "value": "长宁区"}, {"pct": 0.07692307692307693, "value": "青浦区"}, {"pct": 0.07692307692307693, "value": "虹口区"}], "semantic_type": "dimension", "distinct_count": 13, "distinct_ratio": 0.043333333333333335, "pk_candidate_score": 0.043333333333333335, "metric_candidate_score": 0.0}, {"name": "meter_diameter", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "水表直径,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.125, "value": "20mm"}, {"pct": 0.125, "value": "15mm"}, {"pct": 0.125, "value": "25mm"}, {"pct": 0.125, "value": "40mm"}, {"pct": 0.125, "value": "150mm"}, {"pct": 0.125, "value": "100mm"}, {"pct": 0.125, "value": "80mm"}, {"pct": 0.125, "value": "50mm"}], "semantic_type": "dimension", "distinct_count": 8, "distinct_ratio": 0.02666666666666667, "pk_candidate_score": 0.02666666666666667, "metric_candidate_score": 0.0}, {"name": "account_id", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "账户ID未提供统计但为关键标识列", "enumish": null, "null_rate": null, "top_values": [], "semantic_type": "id", "distinct_count": null, "distinct_ratio": null, "pk_candidate_score": 1.0, "metric_candidate_score": 0.0}, {"name": "service_point_id", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "服务点ID未提供统计但为关键标识列", "enumish": null, "null_rate": null, "top_values": [], "semantic_type": "id", "distinct_count": null, "distinct_ratio": null, "pk_candidate_score": 1.0, 
"metric_candidate_score": 0.0}, {"name": "station", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "站点名称,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.027777777777777776, "value": "新闸站"}, {"pct": 0.027777777777777776, "value": "宝杨站"}, {"pct": 0.027777777777777776, "value": "江川站"}, {"pct": 0.027777777777777776, "value": "长江站"}, {"pct": 0.027777777777777776, "value": "市光站"}, {"pct": 0.027777777777777776, "value": "徐泾站"}, {"pct": 0.027777777777777776, "value": "真北站"}, {"pct": 0.027777777777777776, "value": "半淞园站"}, {"pct": 0.027777777777777776, "value": "芙蓉江站"}, {"pct": 0.027777777777777776, "value": "密云站"}], "semantic_type": "dimension", "distinct_count": 36, "distinct_ratio": 0.12, "pk_candidate_score": 0.12, "metric_candidate_score": 0.0}, {"name": "meter_type", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "水表类型,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.2, "value": "容积式机械水表"}, {"pct": 0.2, "value": "速度式机械水表"}, {"pct": 0.2, "value": "电磁式远传水表"}, {"pct": 0.2, "value": "速度式机电远传水表"}, {"pct": 0.2, "value": "超声波式远传水表"}], "semantic_type": "dimension", "distinct_count": 5, "distinct_ratio": 0.016666666666666666, "pk_candidate_score": 0.016666666666666666, "metric_candidate_score": 0.0}, {"name": "meter_subtype", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "水表子类型,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.1111111111111111, "value": "旋翼半液封式"}, {"pct": 0.1111111111111111, "value": "超声波式"}, {"pct": 0.1111111111111111, "value": "旋翼湿式(指针式)"}, {"pct": 0.1111111111111111, "value": "旋翼湿式(数字指针式)"}, {"pct": 0.1111111111111111, "value": "电磁式"}, {"pct": 0.1111111111111111, "value": "无直管段要求超声波式"}, {"pct": 0.1111111111111111, "value": "无直管段要求电磁式"}, {"pct": 0.1111111111111111, "value": "垂直螺翼干式"}, {"pct": 
0.1111111111111111, "value": "机械容积式"}], "semantic_type": "dimension", "distinct_count": 9, "distinct_ratio": 0.03, "pk_candidate_score": 0.03, "metric_candidate_score": 0.0}, {"name": "meter_status", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "水表状态,仅有效,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 1.0, "value": "有效"}], "semantic_type": "dimension", "distinct_count": 1, "distinct_ratio": 0.0033333333333333335, "pk_candidate_score": 0.0033333333333333335, "metric_candidate_score": 0.0}, {"name": "installation_position", "dtype": "string", "stats": {"max": null, "min": null, "std": null, "mean": null, "skewness": null}, "comment": "安装位置,枚举值,非空", "enumish": true, "null_rate": 0.0, "top_values": [{"pct": 0.25, "value": "嵌墙表"}, {"pct": 0.25, "value": "管道井表"}, {"pct": 0.25, "value": "地下表"}, {"pct": 0.25, "value": "龙头表"}], "semantic_type": "dimension", "distinct_count": 4, "distinct_ratio": 0.013333333333333334, "pk_candidate_score": 0.013333333333333334, "metric_candidate_score": 0.0}], "quality": {"warning_hints": [], "failed_expectations": []}, "row_count": 300, "fk_candidates": [], "confidence_notes": ["role判定为dimension:所有列均为低熵枚举型维度字段,无数值型指标列,符合维度表特征。", "grain推测为account_id和service_point_id:二者为唯一标识符,且无其他复合主键信息,结合业务常识推断为粒度核心。", "time列未知:无任何日期/时间列,无时间相关命名或统计,无法推断时间维度。", "primary_key_candidates:基于account_id和service_point_id的高唯一性,未发现重复及非空性推断,置信度高。"], "primary_key_candidates": [["account_id", "service_point_id"]]}