Python | 正規表現の性能とアンチパターン（上級向け）

Python

2022.03.19 / 2025.11.05

では、先ほどの Notebook をさらに発展させて、爆発的バックトラッキングの試行回数が指数的に増える様子をアニメーションで可視化する教材にします。

Python では matplotlib.animation を使って、(a+)+ のパターンに対するバックトラック試行の増加を視覚化できます。

Notebook アニメーション化例
1. 説明
2. Notebook 全体の流れ

Notebook アニメーション化例

# ==========================
# セル7: バックトラック試行回数のアニメーション
# ==========================
import matplotlib.pyplot as plt
import matplotlib.animation as animation

# Simplified model: approximate the number of backtracking attempts for an
# input string of length n with an exponential function.
n_max = 15
x = [*range(1, n_max + 1)]
# For the pattern (a+)+ the attempt count is modelled as roughly 2^(n-1).
y = [1 << (length - 1) for length in x]

# Create the figure and an initially empty line; the animation callbacks
# fill in its data frame by frame.
fig, ax = plt.subplots()
(line,) = ax.plot([], [], 'ro-', lw=2)
# Fix the axis ranges up front from the precomputed data (n_max, y) and set
# the axis labels and title in one batch call.
ax.set(
    xlim=(0, n_max + 1),
    ylim=(0, max(y) * 1.1),
    xlabel='文字列長 n',
    ylabel='バックトラック試行回数',
    title='Catastrophic Backtrackingの試行回数増加',
)

def init():
    """Clear the module-level ``line`` and return it as a one-element tuple.

    Passed to ``FuncAnimation`` as ``init_func``.
    """
    no_x, no_y = [], []
    line.set_data(no_x, no_y)
    return (line,)

def animate(i):
    """Show the first ``i + 1`` points of ``x``/``y`` on the module-level ``line``.

    Args:
        i: Frame index supplied by the animation.

    Returns:
        A one-element tuple containing the updated ``line``.
    """
    visible = i + 1
    xs_so_far = x[:visible]
    ys_so_far = y[:visible]
    line.set_data(xs_so_far, ys_so_far)
    return (line,)

# Build the animation: `init` draws the empty starting state and `animate`
# is called once per frame for n_max frames, without looping afterwards.
# The result is bound to `ani` so a reference to the animation is retained.
# NOTE(review): with a non-interactive notebook backend this may show only a
# static figure -- confirm the backend used by the notebook.
ani = animation.FuncAnimation(
    fig,
    animate,
    init_func=init,
    frames=n_max,
    repeat=False,
    blit=True,
)
plt.show()

# ==========================
# セル7: バックトラック試行回数のアニメーション
# ==========================
import matplotlib.pyplot as plt
import matplotlib.animation as animation

# Simplified model: approximate the number of backtracking attempts for an
# input string of length n with an exponential function.
n_max = 15
x = [*range(1, n_max + 1)]
# For the pattern (a+)+ the attempt count is modelled as roughly 2^(n-1).
y = [1 << (length - 1) for length in x]

# Create the figure and an initially empty line; the animation callbacks
# fill in its data frame by frame.
fig, ax = plt.subplots()
(line,) = ax.plot([], [], 'ro-', lw=2)
# Fix the axis ranges up front from the precomputed data (n_max, y) and set
# the axis labels and title in one batch call.
ax.set(
    xlim=(0, n_max + 1),
    ylim=(0, max(y) * 1.1),
    xlabel='文字列長 n',
    ylabel='バックトラック試行回数',
    title='Catastrophic Backtrackingの試行回数増加',
)

def init():
    """Clear the module-level ``line`` and return it as a one-element tuple.

    Passed to ``FuncAnimation`` as ``init_func``.
    """
    no_x, no_y = [], []
    line.set_data(no_x, no_y)
    return (line,)

def animate(i):
    """Show the first ``i + 1`` points of ``x``/``y`` on the module-level ``line``.

    Args:
        i: Frame index supplied by the animation.

    Returns:
        A one-element tuple containing the updated ``line``.
    """
    visible = i + 1
    xs_so_far = x[:visible]
    ys_so_far = y[:visible]
    line.set_data(xs_so_far, ys_so_far)
    return (line,)

# Build the animation: `init` draws the empty starting state and `animate`
# is called once per frame for n_max frames, without looping afterwards.
# The result is bound to `ani` so a reference to the animation is retained.
# NOTE(review): with a non-interactive notebook backend this may show only a
# static figure -- confirm the backend used by the notebook.
ani = animation.FuncAnimation(
    fig,
    animate,
    init_func=init,
    frames=n_max,
    repeat=False,
    blit=True,
)
plt.show()