在SQL Server中實現最短路徑搜尋的解決方案

最後更新：2018-12-08 來源：互聯網

上載者：User

創建阿里雲帳戶，並獲得超過 40 款產品的免費試用版；而企業帳戶則可以享有總值 $1200 的免費試用版。立即註冊！

開始

這是去年的問題了，今天在整理郵件的時候才發現這個問題，感覺頂有意思的，特記錄下來。

在表RelationGraph中，有三個欄位（ID,Node,RelatedNode）,其中Node和RelatedNode兩個欄位描述兩個節點的串連關係；現在要求，找出從節點"p"至節點"j"，最短路徑（即經過的節點最少）。

圖1.

解析：

了能夠更好的描述表RelationGraph中欄位Node和 RelatedNode的關係，我在這裡特意使用一個圖形來描述，
2.

圖2.

在圖2，可清晰的看出各個節點直接如何相連，也可以清楚的看出節點"p"至節點"j"的的幾種可能路徑。

從上面可以看出第2種可能路徑，經過的節點最少。

為瞭解決開始的問題，我參考了兩種方法，

第1方法是，

參考單源最短路徑演算法：Dijkstra(迪傑斯特拉)演算法，主要特點是以起始點為中心向外層層擴充，直到擴充到終點為止。

圖3.

第2方法是，

針對第1種方法的改進，就是採用多源點方法，這裡就是以節點"p"和節點"j"為中心向外層擴充，直到兩圓外切點，4. ：

圖4.

實現：

在接下來，我就描述在SQL Server中，如何?。當然我這裡採用的前面說的第2種方法，以"P"和"J"為始點像中心外層層擴充。

這裡提供有表RelactionGraph的create& Insert資料的指令碼：

複製代碼代碼如下:use TestDB

if object_id('RelactionGraph') Is not null drop table RelactionGraph

create table RelactionGraph(ID int identity,Item nvarchar(50),RelactionItem nvarchar(20),constraint PK_RelactionGraph primary key(ID))

create nonclustered index IX_RelactionGraph_Item on RelactionGraph(Item) include(RelactionItem)

create nonclustered index IX_RelactionGraph_RelactionItem on RelactionGraph(RelactionItem) include(Item)

insert into RelactionGraph (Item, RelactionItem ) values

('a','b'),('a','c'),('a','d'),('a','e'),

('b','f'),('b','g'),('b','h'),

('c','i'),('c','j'),

('f','k'),('f','l'),

('k','o'),('k','p'),

('o','i'),('o','l')

編寫一個預存程序up_GetPath複製代碼代碼如下:use TestDB
go
--Procedure:
if object_id('up_GetPath') Is not null
Drop proc up_GetPath
go
create proc up_GetPath
(
@Node nvarchar(50),
@RelatedNode nvarchar(50)
)
As
set nocount on

declare
@level smallint =1, --當前搜尋的深度
@MaxLevel smallint=100, --最大可搜尋深度
@Node_WhileFlag bit=1, --以@Node作為中心進行搜尋時候，作為能否迴圈搜尋的標記
@RelatedNode_WhileFlag bit=1 --以@RelatedNode作為中心進行搜尋時候，作為能否迴圈搜尋的標記

--如果直接找到兩個Node存在直接關係就直接返回
if Exists(select 1 from RelationGraph where (Node=@Node And RelatedNode=@RelatedNode) or (Node=@RelatedNode And RelatedNode=@Node) ) or @Node=@RelatedNode
begin
select convert(nvarchar(2000),@Node + ' --> '+ @RelatedNode) As RelationGraphPath,convert(smallint,0) As StopCount
return
end

if object_id('tempdb..#1') Is not null Drop Table #1 --暫存資料表#1，儲存的是以@Node作為中心向外擴充的各節點資料
if object_id('tempdb..#2') Is not null Drop Table #2 --暫存資料表#2，儲存的是以@RelatedNode作為中心向外擴充的各節點資料

create table #1(
Node nvarchar(50),--相對源點
RelatedNode nvarchar(50), --相對目標
Level smallint --深度
)

create table #2(Node nvarchar(50),RelatedNode nvarchar(50),Level smallint)

insert into #1 ( Node, RelatedNode, Level )
select Node, RelatedNode, @level from RelationGraph a where a.Node =@Node union --正向：以@Node作為源查詢
select RelatedNode, Node, @level from RelationGraph a where a.RelatedNode = @Node --反向：以@Node作為目標進行查詢
set @Node_WhileFlag=sign(@@rowcount)

insert into #2 ( Node, RelatedNode, Level )
select Node, RelatedNode, @level from RelationGraph a where a.Node =@RelatedNode union --正向：以@RelatedNode作為源查詢
select RelatedNode, Node, @level from RelationGraph a where a.RelatedNode = @RelatedNode --反向：以@RelatedNode作為目標進行查詢
set @RelatedNode_WhileFlag=sign(@@rowcount)

--如果在表RelationGraph中找不到@Node 或 @RelatedNode 資料，就直接跳過後面的While過程
if not exists(select 1 from #1) or not exists(select 1 from #2)
begin
goto While_Out
end

while not exists(select 1 from #1 a inner join #2 b on b.RelatedNode=a.RelatedNode) --判斷是否出現切點
and (@Node_WhileFlag|@RelatedNode_WhileFlag)>0 --判斷是否能搜尋
And @level<@MaxLevel --控制深度
begin
if @Node_WhileFlag >0
begin
insert into #1 ( Node, RelatedNode, Level )
--正向
select a.Node,a.RelatedNode,@level+1
From RelationGraph a
where exists(select 1 from #1 where RelatedNode=a.Node And Level=@level) And
Not exists(select 1 from #1 where Node=a.Node)
union
--反向
select a.RelatedNode,a.Node,@level+1
From RelationGraph a
where exists(select 1 from #1 where RelatedNode=a.RelatedNode And Level=@level) And
Not exists(select 1 from #1 where Node=a.RelatedNode)

set @Node_WhileFlag=sign(@@rowcount)

end

if @RelatedNode_WhileFlag >0
begin
insert into #2 ( Node, RelatedNode, Level )
--正向
select a.Node,a.RelatedNode,@level+1
From RelationGraph a
where exists(select 1 from #2 where RelatedNode=a.Node And Level=@level) And
Not exists(select 1 from #2 where Node=a.Node)
union
--反向
select a.RelatedNode,a.Node,@level+1
From RelationGraph a
where exists(select 1 from #2 where RelatedNode=a.RelatedNode And Level=@level) And
Not exists(select 1 from #2 where Node=a.RelatedNode)
set @RelatedNode_WhileFlag=sign(@@rowcount)
end

select @level+=1
end

While_Out:

--下面是構造返回的結果路徑
if object_id('tempdb..#Path1') Is not null Drop Table #Path1
if object_id('tempdb..#Path2') Is not null Drop Table #Path2

;with cte_path1 As
(
select a.Node,a.RelatedNode,Level,convert(nvarchar(2000),a.Node+' -> '+a.RelatedNode) As RelationGraphPath,Convert(smallint,1) As PathLevel From #1 a where exists(select 1 from #2 where RelatedNode=a.RelatedNode)
union all
select b.Node,a.RelatedNode,b.Level,convert(nvarchar(2000),b.Node+' -> '+a.RelationGraphPath) As RelationGraphPath ,Convert(smallint,a.PathLevel+1) As PathLevel
from cte_path1 a
inner join #1 b on b.RelatedNode=a.Node
and b.Level=a.Level-1
)
select * Into #Path1 from cte_path1

;with cte_path2 As
(
select a.Node,a.RelatedNode,Level,convert(nvarchar(2000),a.Node) As RelationGraphPath,Convert(smallint,1) As PathLevel From #2 a where exists(select 1 from #1 where RelatedNode=a.RelatedNode)
union all
select b.Node,a.RelatedNode,b.Level,convert(nvarchar(2000),a.RelationGraphPath+' -> '+b.Node) As RelationGraphPath ,Convert(smallint,a.PathLevel+1)
from cte_path2 a
inner join #2 b on b.RelatedNode=a.Node
and b.Level=a.Level-1
)
select * Into #Path2 from cte_path2

;with cte_result As
(
select a.RelationGraphPath+' -> '+b.RelationGraphPath As RelationGraphPath,a.PathLevel+b.PathLevel -1 As StopCount,rank() over(order by a.PathLevel+b.PathLevel) As Result_row
From #Path1 a
inner join #Path2 b on b.RelatedNode=a.RelatedNode
and b.Level=1
where a.Level=1
)
select distinct RelationGraphPath,StopCount From cte_result where Result_row=1
go

上面的預存程序，主要分為兩大部分，第1部分是實現如何搜尋，第2部分實現如何構造返回結果。其中第1部分的代碼根據前面的方法2，通過@Node 和 @RelatedNode 兩個節點向外層搜尋，每次搜尋返回的節點都儲存至暫存資料表#1和#2，再判斷暫存資料表#1和#2有沒有出現切點，如果出現就說明已找到最短的路徑（經過多節點數最少），否則就繼續迴圈搜尋，直到迴圈至最大的搜尋深度（@MaxLevel smallint=100）或找到切點。要是到100層都沒搜尋到切點，將放棄搜尋。這裡使用最大可搜尋深度@MaxLevel，目的是控制由於資料量大可能會導致效能差，因為在這裡資料量與搜尋效能成反比。代碼中還說到一個正向和反向搜尋，主要是相對Node 和 RelatedNode來說，它們兩者互為參照對象，進行向外搜尋使用。

下面是預存程序的執行：

複製代碼代碼如下:use TestDB

exec dbo.up_GetPath

@Node = 'p',

@RelatedNode = 'j'

你可以根據需要來，賦予@Node 和 @RelatedNode不同的值。

拓展：

前面的例子，可擴充至城市的大眾運輸路線，提供兩個網站，搜尋經過這兩個網站最少網站大眾運輸路線；可以擴充至社區的人際關係的搜尋，如一個人與另一個人想認識，那麼他們直接要經過多少個人才可以。除了人與人直接有直接的朋友、親戚關聯，還可以通過人與物有關聯找到人與人關聯，如幾個作家通過出版一個本，那麼就說明這幾個人可以通過某一本書的作者列表中找到他們存在共同出版書籍的關聯，這為搜尋兩個人認識路徑提供參考。這問題可能會非常大複雜，但可以這樣的擴充。

小結：

這裡只是找兩個節點的所有路徑中，節點數最少的路徑，在實際的應用中，可能會碰到比這裡更複雜的情況。在其他的環境或情境可能會帶有長度，時間，多節點，多範圍等一些資訊。無論如何，一般都要參考一些原理，演算法來實現。

本文章原先以中文撰寫並發佈於 aliyun.com，亦設英文版本，僅作資訊用途。本網站不對文章的準確性，完整性或可靠性或其任何翻譯作出任何明示或暗示的陳述或保證。如對該文章有任何疑慮或投訴，請傳送電郵至 info-contact@alibabacloud.com 並提供相關疑慮或投訴的詳細說明。職員會於 5 個工作天內與您聯絡，一經驗證之後，即會刪除該侵權內容。

A Free Trial That Lets You Build Big!

Start building with 50+ products and up to 12 months usage for Elastic Compute Service

Get Started for Free

Sales Support

1 on 1 presale consultation

Chat Contact Sales
After-Sales Support

24/7 Technical Support 6 Free Tickets per Quarter Faster Response

Open a Ticket
Alibaba Cloud offers highly flexible support services tailored to meet your exact needs.

Learn More