join comma delimited data column
my table1 is :
T1
col1 col2
C1 john
C2 alex
C3 piers
C4 sara
and so table 2:
T2
col1 col2
R1 C1,C2,C4
R2 C3,C4
R3 C1,C4
How can I get the following result?
query result
col1 col2
R1 john,alex,sara
R2 piers,sara
R3 john,sara
Please help me.
Solution 1:
Ideally, your best solution would be to normalize Table2 so you are not storing a comma separated list.
Once you have this data normalized then you can easily query the data. The new table structure could be similar to this:
-- Lookup table: each code in col1 identifies one name in col2.
create table T1
(
    col1 varchar(2) constraint pk1_t1 primary key,
    col2 varchar(5)
);

-- Seed the four sample code/name pairs from the question.
insert into T1 (col1, col2)
select seed.code, seed.name
from
(
    values
        ('C1', 'john'),
        ('C2', 'alex'),
        ('C3', 'piers'),
        ('C4', 'sara')
) as seed (code, name);
-- Junction table: one row per (key, code) pair instead of a comma-separated
-- list, with every code required to exist in T1.
create table T2
(
    col1 varchar(2),
    col2 varchar(2) constraint fk1_col2 foreign key references t1 (col1),
    constraint pk1_t2 primary key (col1, col2)
);

-- Seed the sample lists from the question, one row per list item.
insert into T2 (col1, col2)
select pair.list_key, pair.code
from
(
    values
        ('R1', 'C1'),
        ('R1', 'C2'),
        ('R1', 'C4'),
        ('R2', 'C3'),
        ('R2', 'C4'),
        ('R3', 'C1'),
        ('R3', 'C4')
) as pair (list_key, code);
Normalizing the tables would make it much easier for you to query the data by joining the tables:
-- One output row per (key, name) pair from the normalized tables.
SELECT pair.col1,
       person.col2
FROM t2 AS pair
INNER JOIN t1 AS person
    ON person.col1 = pair.col2
See Demo
Then if you wanted to display the data as a comma-separated list, you could use FOR XML PATH
and STUFF
:
-- Builds one comma-separated list of names per T2 key from the normalized tables.
select distinct t2.col1,
    STUFF(
        (SELECT distinct ', ' + t1.col2
         FROM t1
         inner join t2 t
             on t1.col1 = t.col2
         where t2.col1 = t.col1
         -- TYPE + .value() returns the text un-escaped; plain FOR XML PATH
         -- would turn '&', '<' and '>' in a name into XML entities.
         FOR XML PATH (''), TYPE).value('.', 'varchar(max)'),
        -- Every item is prefixed with ', ' (two characters), so strip two
        -- characters; stripping one leaves a leading space in the result.
        1, 2, '') col2
from t2;
See Demo.
If you are not able to normalize the data, then there are several things that you can do.
First, you could create a split function that will convert the data stored in the list into rows that can be joined on. The split function would be similar to this:
-- Splits @String on @Delimiter and returns one row per non-blank item.
--   @String    : the delimited list; NULL, empty or all-space input returns no rows.
--   @Delimiter : the single character that separates items.
--   returns    : table (items) holding the pieces in the order they are found;
--                pieces that are empty or consist only of spaces are skipped.
CREATE FUNCTION [dbo].[Split](@String varchar(MAX), @Delimiter char(1))
returns @temptable TABLE (items varchar(MAX))
as
begin
    declare @idx int
    -- Same width as the input and the output column, so long items are not
    -- silently cut at 8000 characters.
    declare @slice varchar(MAX)
    select @idx = 1
    if @String is null or len(@String) < 1 return
    while @idx != 0
    begin
        set @idx = charindex(@Delimiter, @String)
        if @idx != 0
            set @slice = left(@String, @idx - 1)
        else
            set @slice = @String
        if (len(@slice) > 0)
            insert into @temptable(items) values(@slice)
        -- No delimiter left: the remainder was the last item.
        if @idx = 0 break
        -- Drop the consumed item and its delimiter. SUBSTRING from @idx + 1 is
        -- used instead of RIGHT(@String, LEN(@String) - @idx) because LEN
        -- ignores trailing spaces, which made RIGHT keep too few characters
        -- (e.g. 'C1,C2,C4 ' produced 'C1', '2', '4').
        set @String = substring(@String, @idx + 1, datalength(@String))
        if datalength(@String) = 0 break
    end
    return
end;
When you use the split function, you can either leave the data in multiple rows or concatenate the values back into a comma-separated list:
-- Splits each T2 list into rows, looks every code up in T1, then rebuilds
-- one comma-separated list of names per T2 key.
;with cte as
(
    select c.col1, t1.col2
    from t1
    inner join
    (
        -- One row per (key, code) taken from the comma-separated column.
        select t2.col1, i.items col2
        from t2
        cross apply dbo.split(t2.col2, ',') i
    ) c
        on t1.col1 = c.col2
)
select distinct c.col1,
    STUFF(
        (SELECT distinct ', ' + c1.col2
         FROM cte c1
         where c.col1 = c1.col1
         -- TYPE + .value() returns the text un-escaped; plain FOR XML PATH
         -- would turn '&', '<' and '>' in a name into XML entities.
         FOR XML PATH (''), TYPE).value('.', 'varchar(max)'),
        -- Every item is prefixed with ', ' (two characters), so strip two
        -- characters; stripping one leaves a leading space in the result.
        1, 2, '') col2
from cte c
See Demo.
A final way that you could get the result is by applying FOR XML PATH
directly.
-- For every T2 row, collect the names whose code appears as a whole item in
-- the comma-separated list, then drop the leading ', ' inside the XML value.
SELECT list.col1,
       names.as_xml.value('substring(text()[1], 3)', 'varchar(max)') AS col2
FROM t2 AS list
OUTER APPLY
(
    SELECT ', ' + person.col2
    FROM t1 AS person
    -- Both sides are wrapped in commas so a code only matches a complete item.
    WHERE ',' + list.col2 + ',' LIKE '%,' + CAST(person.col1 AS varchar(10)) + ',%'
    FOR XML PATH(''), TYPE
) AS names (as_xml);
See SQL Fiddle with Demo
Solution 2:
Here's a way of splitting the data without a function, then using the standard XML PATH
method for getting the CSV list:
-- Pair every T2 row with each T1 name whose code occurs as a whole item in
-- the row's comma-separated list (both sides are wrapped in commas).
WITH matched AS
(
    SELECT list.col1,
           person.col2
    FROM T2 AS list
    INNER JOIN T1 AS person
        ON CHARINDEX(',' + person.col1 + ',', ',' + list.col2 + ',') > 0
)
-- Concatenate the matched names per key; STUFF removes the leading comma.
SELECT list.col1,
       STUFF(
           (
               SELECT ',' + matched.col2
               FROM matched
               WHERE matched.col1 = list.col1
               FOR XML PATH('')
           ),
           1, 1, ''
       ) AS col2
FROM T2 AS list
SQL Fiddle with demo.
As has been mentioned elsewhere in this question, it is hard to query this sort of denormalised data efficiently, so your first priority should be to investigate updating the table structure; this query will at least allow you to get the results you require.
Solution 3:
If you wanted to do this task in Oracle, you could use listagg
and accomplish it easily.
The closest equivalent to listagg in older versions of SQL Server
is FOR XML PATH combined with STUFF (STUFF only removes the leading separator).
Using them, you can try the following query:
-- For every T2 row, look up the name of each code in its comma-separated
-- list and join the names back together with commas.
SELECT T2.Col1,
       Stuff((SELECT ',' + CAST(T1.Col2 AS VARCHAR(100))
              FROM T1
              -- LIKE without wildcards is an equality test against the whole
              -- list and never matches. Wrapping both sides in commas makes a
              -- code match only as a complete list item.
              WHERE ',' + T2.Col2 + ',' LIKE '%,' + T1.Col1 + ',%'
              FOR Xml Path('')),
             1,
             1,
             '') AS Col2
FROM T2
Solution 4:
First, write a table-valued function to split col2 of T2.
-- Splits @String on @Delimiter and returns one row per non-blank item.
--   @String    : the delimited list; NULL, empty or all-space input returns no rows.
--   @Delimiter : the single character that separates items.
--   returns    : table (items) holding the pieces in the order they are found;
--                pieces that are empty or consist only of spaces are skipped.
CREATE FUNCTION [dbo].[Split](@String varchar(100), @Delimiter char(1))
-- Items are as wide as the input, so an item longer than 5 characters is no
-- longer silently truncated before it is returned.
returns @temptable TABLE (items VARCHAR(100))
as
begin
    declare @idx int
    declare @slice VARCHAR(100)
    select @idx = 1
    if @String is null or len(@String) < 1 return
    while @idx != 0
    begin
        set @idx = charindex(@Delimiter, @String)
        if @idx != 0
            set @slice = left(@String, @idx - 1)
        else
            set @slice = @String
        if (len(@slice) > 0)
            insert into @temptable(items) values(@slice)
        -- No delimiter left: the remainder was the last item.
        if @idx = 0 break
        -- Drop the consumed item and its delimiter. SUBSTRING from @idx + 1 is
        -- used instead of RIGHT(@String, LEN(@String) - @idx) because LEN
        -- ignores trailing spaces, which made RIGHT keep too few characters.
        set @String = substring(@String, @idx + 1, datalength(@String))
        if datalength(@String) = 0 break
    end
    return
end
Go
-- SplitList: one row per (T2 key, name), produced by splitting the
-- comma-separated column and looking each code up in T1.
;with SplitList as
(
    select list.Col1,
           person.Col2
    from T2 as list
    cross apply dbo.Split(list.Col2, ',') as piece
    inner join T1 as person
        on person.Col1 = piece.Items
)
-- Rebuild the list of names per key; the leading ', ' (two characters) is removed.
select list.Col1,
       stuff(
           (
               select ', ' + SplitList.Col2
               from SplitList
               where SplitList.Col1 = list.Col1
               for xml path('')
           ),
           1, 2, ''
       )
from T2 as list
Solution 5:
If you are like me and prefer CTEs, especially recursive CTEs, as opposed to STUFF and XML PATH:
-- Sample data from the question, held in table variables.
-- @T1 maps a code to a name; @T2 holds a comma-separated list of codes per key.
DECLARE @T1 TABLE (col1 CHAR(2), col2 VARCHAR(10));
DECLARE @T2 TABLE (col1 CHAR(2), col2 CHAR(100));

INSERT INTO @T1 (col1, col2)
VALUES
    ('C1', 'john'),
    ('C2', 'alex'),
    ('C3', 'piers'),
    ('C4', 'sara');

INSERT INTO @T2 (col1, col2)
VALUES
    ('R1', 'C1,C2,C4'),
    ('R2', 'C3,C4'),
    ('R3', 'C1,C4');
-- Number the @T2 rows so each list can be followed through the recursion.
WITH T2Sorted AS (
    SELECT col1,
           col2,
           ROW_NUMBER() OVER (ORDER BY col1) AS RN
    FROM @T2
),
-- Walk every list from comma to comma: each row holds the position of the
-- previous comma (0 at the start) and of the next one (0 when none is left).
CTERecursionOnT2 AS (
    SELECT RN,
           col1,
           col2,
           0 AS PrevCharIndex,
           CHARINDEX(',', col2, 1) AS NextCharIndex
    FROM T2Sorted
    UNION ALL
    SELECT src.RN,
           src.col1,
           src.col2,
           prev.NextCharIndex,
           CHARINDEX(',', src.col2, prev.NextCharIndex + 1)
    FROM T2Sorted AS src
    INNER JOIN CTERecursionOnT2 AS prev
        ON src.RN = prev.RN
    WHERE prev.NextCharIndex > 0
),
-- Cut out the item that lies between the two comma positions.
CTEIndividualCol2Items AS (
    SELECT col1,
           PrevCharIndex,
           SUBSTRING(
               col2,
               PrevCharIndex + 1,
               CASE
                   WHEN NextCharIndex = 0 THEN LEN(col2) - PrevCharIndex
                   ELSE NextCharIndex - 1 - PrevCharIndex
               END
           ) AS itemCol2
    FROM CTERecursionOnT2
),
-- Replace each code by its name and number the names in list order per key.
CTELookupT1 AS (
    SELECT item.col1,
           person.col2,
           ROW_NUMBER() OVER (PARTITION BY item.col1 ORDER BY item.PrevCharIndex) AS RN
    FROM CTEIndividualCol2Items AS item
    INNER JOIN @T1 AS person
        ON item.itemCol2 = person.col1
),
-- Append the names one by one, producing a growing list per key.
CTERecursionOnLookupT1 AS (
    SELECT col1,
           CAST(col2 AS VARCHAR(MAX)) AS col2,
           RN
    FROM CTELookupT1
    WHERE RN = 1
    UNION ALL
    SELECT nxt.col1,
           acc.col2 + ',' + nxt.col2,
           nxt.RN
    FROM CTELookupT1 AS nxt
    INNER JOIN CTERecursionOnLookupT1 AS acc
        ON nxt.col1 = acc.col1
       AND nxt.RN = acc.RN + 1
),
-- Rank the partial lists so that the complete one (highest RN) comes first.
CTEFinal AS (
    SELECT col1,
           col2,
           RN,
           ROW_NUMBER() OVER (PARTITION BY col1 ORDER BY RN DESC) AS RNDesc
    FROM CTERecursionOnLookupT1
)
SELECT col1,
       col2
FROM CTEFinal
WHERE RNDesc = 1
ORDER BY col1
Obviously you could break up the first recursion part into separate functions as the already agreed solution has suggested i.e. CTERecursionOnT2 and thus CTEIndividualCol2Items can be your alternative Split function (I would include the order id as well), and thus:
-- Replaces the first recursion with a call to dbo.Split; the rest of the
-- query is elided ("...") exactly as in the original snippet.
;WITH CTEIndividualCol2Items AS (
    -- The derived table exposes only (id, items), so the item text must be
    -- read from b.items; b.value does not exist. id keeps the list order.
    SELECT a.col1, b.items AS itemCol2, b.id AS PrevCharIndex
    FROM @T2 a
    CROSS APPLY (
        SELECT id, items FROM dbo.Split(a.col2, ',')
    ) b
) ...
and your split function:
-- Inline table-valued split: returns (Id, items) with one row per piece of
-- @String between occurrences of @Delimiter; Id numbers the pieces from 1 in
-- list order. No rows are returned unless @String > ''.
CREATE FUNCTION dbo.Split(@String varchar(100), @Delimiter char(1))
RETURNS TABLE
AS
RETURN
(
    -- Each row holds the position of the delimiter before a piece (0 for the
    -- first piece) and of the delimiter after it (0 when it is the last one).
    WITH Boundaries (id, PrevCharIndex, NextCharIndex) AS (
        SELECT 1,
               0,
               CHARINDEX(@Delimiter, @String, 1)
        UNION ALL
        SELECT id + 1,
               NextCharIndex,
               CHARINDEX(@Delimiter, @String, NextCharIndex + 1)
        FROM Boundaries
        WHERE NextCharIndex > 0
    )
    SELECT Id,
           SUBSTRING(
               @String,
               PrevCharIndex + 1,
               CASE
                   WHEN NextCharIndex = 0 THEN LEN(@String) - PrevCharIndex
                   ELSE NextCharIndex - 1 - PrevCharIndex
               END
           ) AS items
    FROM Boundaries
    WHERE @String > ''
)