【问题标题】:Python "RuntimeError: maximum recursion depth exceeded" in depth-first search深度优先搜索中的Python“RuntimeError:超出最大递归深度”
【发布时间】:2017-08-21 12:46:28
【问题描述】:

我正在尝试为有向图实现深度优先搜索 (DFS) 算法,如 Cormen 等人 Introduction to Algorithms (3rd ed.) 中所述。到目前为止,这是我的实现:

import pytest
from collections import OrderedDict
import copy


class Node(object):
    def __init__(self, color='white', parent=None, d=None, f=None):
        self.color = color
        self.parent = parent
        self.d = d          # Discovery time
        self.f = f          # Finishing time


class Graph(object):
    def __init__(self, edges, node_indices=None):
        self.edges = edges
        self.nodes = self.initialize_nodes(node_indices )
        self.adj = self.initialize_adjacency_list()

    def initialize_nodes(self, node_indices=None):
        if node_indices is None:
            node_indices = sorted(list(set(node for edge in self.edges for node in edge)))
        return OrderedDict([(node_index, Node()) for node_index in node_indices])

    def initialize_adjacency_list(self):
        A = {node: [] for node in self.nodes}
        for edge in self.edges:
            u, v = edge
            A[u].append(v)
        return A

    def dfs(self):
        self.time = 0
        for u, node in self.nodes.items():
            if node.color == 'white':
                self.dfs_visit(u)

    def dfs_visit(self, u):
        self.time += 1
        self.nodes[u].d = self.time
        self.nodes[u].color = 'gray'
        for v in self.adj[u]:
            if self.nodes[v].color == 'white':
                self.nodes[v].parent = u
                self.dfs_visit(v)
        self.nodes[u].color = 'black'
        self.time += 1
        self.nodes[u].f = self.time

    @staticmethod
    def transpose(edges):
        return [(v,u) for (u,v) in edges]

    def strongly_connected_components(self):
        self.dfs()
        finishing_times = {u: node.f for u, node in self.nodes.items()}
        self.__init__(self.transpose(self.edges))
        node_indices = sorted(finishing_times, key=finishing_times.get, reverse=True)
        self.nodes = self.initialize_nodes(node_indices)
        self.dfs()
        return self.trees()

    def trees(self):
        _trees = []
        nodes = copy.deepcopy(self.nodes)
        while nodes:
            for u, node in nodes.items():
                if node.parent is None:
                    _trees.append([u])
                    nodes.pop(u)
                else:
                    for tree in _trees:
                        if node.parent in tree:
                            tree.append(u)
                            nodes.pop(u)
        return _trees

为了测试它是否有效,我从书中的图 22.9 中举了一个例子:

在将节点 a 重命名为 h 1 分别为 8 之后,我运行了以下测试:

def test_strongly_connected_components():
    edges = [(1,2), (5,1), (2,5), (5,6), (2,6), (6,7), (7,6), (2,3), (3,7), (3,4), (4,3), (4,8), (7,8), (8,8)]
    graph = Graph(edges)
    assert graph.strongly_connected_components() == [[1, 5, 2], [3, 4], [6, 7], [8]]


if __name__ == "__main__":
    pytest.main([__file__+"::test_strongly_connected_components", "-s"])

此测试通过,确认图中灰色阴影的 SCC。

然而,对于“真正的”练习,我需要使用输入文件 SCC.txt,其中包含表示边的 875,714 行(作为整数的头尾对),并输出五个最大 SCC 的大小.为此我尝试了以下测试:

@pytest.fixture
def edges():
    with open('SCC.txt') as f:
        return [tuple(map(int, line.split())) for line in f.read().splitlines()]

def test_SCC_on_full_graph(edges):
    graph = Graph(edges)
    SCCs = graph.strongly_connected_components()
    print([map(len, SCCs)].sort(reverse=True))      # Read off the size of the largest SCCs


if __name__ == "__main__":
    pytest.main([__file__+"::test_SCC_on_full_graph", "-s"])

但是,我遇到了RuntimeError: maximum recursion depth exceeded in cmp

_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 

self = <scc.Graph object at 0x103253690>, u = 209099

    def dfs_visit(self, u):
            self.time += 1
            self.nodes[u].d = self.time
            self.nodes[u].color = 'gray'
            for v in self.adj[u]:
>                   if self.nodes[v].color == 'white':
E                   RuntimeError: maximum recursion depth exceeded in cmp

scc.py:53: RuntimeError
========================== 1 failed in 21.79 seconds ===========================

我读过有关增加sys.setrecursionlimit 的信息,但这似乎不是推荐的做法。除了我不确定如何改进代码,因为它完全实现了书中给出的伪代码。关于如何克服此错误的任何想法?

【问题讨论】:

    标签: python algorithm recursion graph depth-first-search


    【解决方案1】:

    我设法使用增加了stack_size 和递归限制的threading 库解决了这个问题。这是解决方案的代码:

    import sys
    import pytest
    from collections import OrderedDict
    import copy
    import threading
    
    
    class Node(object):
        def __init__(self, color='white', parent=None, d=None, f=None):
            self.color = color
            self.parent = parent
            self.d = d          # Discovery time
            self.f = f          # Finishing time
    
    
    class Graph(object):
        def __init__(self, edges, node_indices=None):
            self.edges = edges
            self.nodes = self.initialize_nodes(node_indices )
            self.adj = self.initialize_adjacency_list()
            self.trees = dict()
    
        def initialize_nodes(self, node_indices=None):
            if node_indices is None:
                node_indices = sorted(list(set(node for edge in self.edges for node in edge)))
            return OrderedDict([(node_index, Node()) for node_index in node_indices])
    
        def initialize_adjacency_list(self):
            A = {node: [] for node in self.nodes}
            for edge in self.edges:
                u, v = edge
                A[u].append(v)
            return A
    
        def dfs(self):
            self.time = 0
            for u, node in self.nodes.items():
                if node.color == 'white':
                    self.dfs_visit(u, root=u)
    
        def dfs_visit(self, u, root=None):
            if u == root:
                self.trees[root] = set()
            self.time += 1
            self.nodes[u].d = self.time
            self.nodes[u].color = 'gray'
            for v in self.adj[u]:
                if self.nodes[v].color == 'white':
                    self.nodes[v].parent = u
                    self.trees[root].add(v)
                    self.dfs_visit(v, root=root)
            self.nodes[u].color = 'black'
            self.time += 1
            self.nodes[u].f = self.time
    
        @staticmethod
        def transpose(edges):
            return [(v,u) for (u,v) in edges]
    
        def strongly_connected_components(self):
            self.dfs()
            finishing_times = {u: node.f for u, node in self.nodes.items()}
            self.__init__(self.transpose(self.edges))
            node_indices = sorted(finishing_times, key=finishing_times.get, reverse=True)
            self.nodes = self.initialize_nodes(node_indices)
            self.dfs()
    
            trees = copy.deepcopy(self.trees)
            for k, v in trees.items():
                v.add(k)
            return trees.values()
    
    
    @pytest.fixture
    def edges():
        with open('SCC.txt') as f:
            return [tuple(map(int, line.split())) for line in f.read().splitlines()]
    
    def SCC_on_full_graph():
        E = edges()
        graph = Graph(E)
        SCCs = graph.strongly_connected_components()
    
        SCC_sizes = sorted(list(map(len, SCCs)), reverse=True)
        print(SCC_sizes[:5])                            # Read off the size of the 5 largest SCCs
    
    
    if __name__ == "__main__":
        threading.stack_size(67108864)
        sys.setrecursionlimit(2**20)
        thread = threading.Thread(target=SCC_on_full_graph)
        thread.start()
    

    【讨论】:

      【解决方案2】:

      DFS 在逻辑上必须是 DFS,但您可以通过编程方式尝试解决方法。

      1. 以这样一种方式编写 DFS,如果它接近递归限制,您可以从顶级函数之一重试它。

      2. 尝试使用多处理。

      PS: 更大的数据集是否可能发生无限递归?使用较大数据集时出现的逻辑错误。 如果您有增量大小的数据集,您还可以确定算法在 python 中实现的限制。

      【讨论】:

        猜你喜欢
        • 2017-03-18
        • 2015-04-15
        • 1970-01-01
        • 1970-01-01
        • 1970-01-01
        • 2013-02-20
        • 2023-01-30
        • 1970-01-01
        • 1970-01-01
        相关资源
        最近更新 更多