基于igraph的网络出行分配

基于igraph的网络出行分配,r,optimization,igraph,shortest-path,R,Optimization,Igraph,Shortest Path,我的问题是: 我有一个街道网络df.net和一个包含trips df.trips的起点和目的地的列表 我需要找到所有链接上的流 library(dplyr) df.net = tribble(~from, ~to, ~weight,1,2,1,2,1,1,1,9,3,9,1,2,2,10,1,10,2,2,9,10,8,10,9,15,9,8,1,8,9,2,7,8,2,12,7,3,9,12,10,12,9,9,12,6,2,6,12,5,11,12,3,12,11,3,5,6,1,11,5

我的问题是:

我有一个街道网络df.net和一个包含trips df.trips的起点和目的地的列表

我需要找到所有链接上的流

library(dplyr)

df.net = tribble(~from, ~to, ~weight,1,2,1,2,1,1,1,9,3,9,1,2,2,10,1,10,2,2,9,10,8,10,9,15,9,8,1,8,9,2,7,8,2,12,7,3,9,12,10,12,9,9,12,6,2,6,12,5,11,12,3,12,11,3,5,6,1,11,5,4,5,11,3,11,4,3,4,3,5,3,10,4,10,11,10)

df.trips = tribble(~from, ~to, ~N,1,2,45,1,4,24,1,5,66,1,9,12,1,11,54,2,3,63,2,4,22,2,7,88,2,12,44,3,2,6,3,8,43,3,10,20,3,11,4,4,1,9,4,5,7,4,6,35,4,9,1,5,7,55,5,8,21,5,1,23,5,7,12,5,2,18,6,2,31,6,3,6,6,5,15,6,8,19,7,1,78,7,2,48,7,3,92,7,6,6,8,2,77,8,4,5,8,5,35,8,6,63,8,7,22)
这是我的解决方案:

library(igraph)

# I construct a directed igraph network:
graph = igraph::graph_from_data_frame(d=df.net, directed=T)
plot(graph)

# I make a vector of edge_ids:
edges = paste0(df.net$from,":",df.net$to)

# and an empty vector of same length to fill with the flow afterwards:
N = integer(length(edges))

# I loop through all Origin-Destination-pairs:
for(i in 1:nrow(df.trips)){

  # provides one shortest path between one Origin & one Destination:
  path = shortest_paths(graph = graph, 
                         from = as.character(df.trips$from[i]), 
                         to = as.character(df.trips$to[i]), 
                         mode = "out", 
                         weights = NULL)

  # Extract the names of vetices on the path:
  a = names(path$vpath[[1]])

  # Make a vector of the edge_ids:  
  a2 = a[2:length(a)]
  a = a[1:(length(a)-1)]
  a = paste0(a,":",a2)  

  # and fill the vector with the trips
  v = integer(length(edges))
  v[edges %in% a] = pull(df.trips[i,3])

  # adding the trips of this iteration to the sum
  N = N + v

}

# attach vector to network-dataframe:
df.net = data.frame(df.net, N)
理论上它是有效的。我的真实网络只需要大约8小时,就可以在一个链接略少于50000条的网络上完成大约500000个起点-终点对

我很确定我的for循环就是罪魁祸首

因此,我关于优化的问题是:

1是否有一个igraph函数可以简单地执行我想要执行的操作?我找不到它

2也许有另一个更适合我需要的包,我没有偶然发现

3如果不是,我是否应该通过使用Rcpp包重写来提高循环性能

不管怎样,我很感激你能给我的任何帮助。
提前谢谢

我希望有一个更快的解决方案,尽管我从您那里得到的结果略有不同

这种方法使用data.table进行多线程处理,每个顶点只调用一次IGRAPHE::shorest_路径,并避免使用图的名称属性,直到最后一步

library(igraph)
library(tibble)
library(data.table)
library(zoo)
library(purrr)
df.net = tribble(~from, ~to, ~weight,1,2,1,2,1,1,1,9,3,9,1,2,2,10,1,10,2,2,9,10,8,10,9,15,9,8,1,8,9,2,7,8,2,12,7,3,9,12,10,12,9,9,12,6,2,6,12,5,11,12,3,12,11,3,5,6,1,11,5,4,5,11,3,11,4,3,4,3,5,3,10,4,10,11,10)
graph = igraph::graph_from_data_frame(d=df.net, directed=T)
df.trips = tribble(~from, ~to, ~N,1,2,45,1,4,24,1,5,66,1,9,12,1,11,54,2,3,63,2,4,22,2,7,88,2,12,44,3,2,6,3,8,43,3,10,20,3,11,4,4,1,9,4,5,7,4,6,35,4,9,1,5,7,55,5,8,21,5,1,23,5,7,12,5,2,18,6,2,31,6,3,6,6,5,15,6,8,19,7,1,78,7,2,48,7,3,92,7,6,6,8,2,77,8,4,5,8,5,35,8,6,63,8,7,22)
l.trips <- split(df.trips,1:nrow(df.trips))


setDT(df.trips)
Result <- df.trips[,setnames(lapply(shortest_paths(graph = graph,from= from,to = to,weights=NULL,mode = "out")$vpath,
                 function(x){zoo::rollapply(x,width=2,c)}) %>% map2(.,N,~ {.x %x% rep(1,.y)} %>% as.data.frame) %>%
           rbindlist %>% .[,.N,by = c("V1","V2")],c("new.from","new.to","N")),by=from][,sum(N),by = c("new.from","new.to")]
Result[,`:=`(new.from = V(graph)$name[Result$new.from],
             new.to = V(graph)$name[Result$new.to])]
#   new.from new.to  V1
# 1:        1      2 320
# 2:        2     10 161
# 3:        1      9 224
# 4:        9      8  73
# 5:       10     11 146
# 6:       11      4 102
# 7:        2      1 167
# 8:        9     12 262
# 9:        4      3  44
#10:        9      1 286
#11:       12      6  83
#12:       12     11  24
#13:       11      5  20
#14:       10      2  16
#15:       11     12  35
#16:       12      7 439
#17:        8      9 485
#18:        7      8 406
#19:        6     12 202

谢谢我去看看!这种差异可能可以通过只分配一条最短路径来解释,我们的代码选择了不同的路径,尽管有时第二条路径同样快。我很难理解您的结果:在数据帧的第二行中有链接2>4,但在我的网络中,这两个节点之间没有直接链接,请参见我发现了我们的结果之间存在差异的原因,因为不应该有任何差异。更改代码中的那一行会产生我的结果:路径正确!追求这些名字会严重影响表演。谢谢我有一个解决办法。我明天就去做!我用10000对OD样本在我的大网络上检查了你的方法。花了4.5分钟。我的代码通常需要5分钟左右。因此,我需要寻找其他方法来改进代码。我试图实现igraph::shortest_paths-functions只在每个原点为所有目的地调用一次,而不是分别为每个目的地调用一次