我假设您的理想目标是在单个复杂查询中获取最多五个姓名和一个地址。此示例在 PostgreSQL 中。您没有指定数据库,但我相信 ORACLE 和 SQLServer 中存在推论。您将不得不做出自己的调整。
它有点乱,但它有效。简而言之,您使用 WINDOW 函数对每个唯一地址的多个名称进行排名。使用 WITH 子句按等级隔离每个名称。 LEFT JOIN 为少于五个名称的地址选择名称。
示例表:
DROP TABLE name_address;
CREATE TABLE name_address
(
first_name CHARACTER VARYING (50)
,last_name CHARACTER VARYING (50)
,addr_line1 CHARACTER VARYING (50)
,city CHARACTER VARYING (50)
,state CHARACTER VARYING (2)
,zip CHARACTER VARYING (5)
)
WITH (OIDS=TRUE);
ALTER TABLE name_address OWNER TO your_name_here;
样本数据:
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'John', 'Smith', '10 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Jane', 'Smith', '10 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Jeff', 'Smith', '12 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Jean', 'Smith', '12 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Jenn', 'Smith', '12 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Jack', 'Smith', '12 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
INSERT INTO name_address (first_name, last_name, addr_line1, city, state, zip) SELECT 'Josh', 'Smith', '12 High Street', 'Beverly Hills NSW 2000', 'CA', '90210';
解决办法:
WITH nr AS (SELECT DISTINCT first_name, last_name, addr_line1, city, state, zip, COUNT(*) OVER(PARTITION BY zip, state, city, addr_line1 ORDER BY zip, state, city, addr_line1, last_name, first_name) AS name_rank
FROM name_address
GROUP BY first_name, last_name, addr_line1, city, state, zip
ORDER BY zip, state, city, addr_line1, name_rank)
,n1 AS(SELECT nr.first_name, nr.last_name, nr.addr_line1, nr.city, nr.state, nr.zip
FROM nr
WHERE nr.name_rank = 1)
,n2 AS(SELECT nr.first_name, nr.last_name, nr.addr_line1, nr.city, nr.state, nr.zip
FROM nr
WHERE nr.name_rank = 2)
,n3 AS(SELECT nr.first_name, nr.last_name, nr.addr_line1, nr.city, nr.state, nr.zip
FROM nr
WHERE nr.name_rank = 3)
,n4 AS(SELECT nr.first_name, nr.last_name, nr.addr_line1, nr.city, nr.state, nr.zip
FROM nr
WHERE nr.name_rank = 4)
,n5 AS(SELECT nr.first_name, nr.last_name, nr.addr_line1, nr.city, nr.state, nr.zip
FROM nr
WHERE nr.name_rank = 5)
SELECT DISTINCT n1.first_name
, n1.last_name
, n2.first_name
, n2.last_name
, n3.first_name
, n3.last_name
, n4.first_name
, n4.last_name
, n5.first_name
, n5.last_name
, na.addr_line1
, na.city
, na.state
, na.zip
FROM name_address AS na
LEFT JOIN n1 ON n1.addr_line1 = na.addr_line1 AND n1.city = na.city AND n1.state = na.state AND n1.zip = na.zip
LEFT JOIN n2 ON n2.addr_line1 = na.addr_line1 AND n2.city = na.city AND n2.state = na.state AND n2.zip = na.zip
LEFT JOIN n3 ON n3.addr_line1 = na.addr_line1 AND n3.city = na.city AND n3.state = na.state AND n3.zip = na.zip
LEFT JOIN n4 ON n4.addr_line1 = na.addr_line1 AND n4.city = na.city AND n4.state = na.state AND n4.zip = na.zip
LEFT JOIN n5 ON n5.addr_line1 = na.addr_line1 AND n5.city = na.city AND n5.state = na.state AND n5.zip = na.zip;
这是最终输出:
“简”;“史密斯”;“约翰”;“史密斯”;“”;“”;“”;“”;“”;“”;“高街 10 号”;“2000 年新南威尔士州比佛利山庄”; "CA";"90210"
“Jack”;“Smith”;“Jean”;“Smith”;“Jeff”;“Smith”;“Jenn”;“Smith”;“Josh”;“Smith”;“12 High Street”;“Beverly Hills NSW 2000";"CA";"90210"