Skip to content

Commit 83cf578

Browse files
punithbajajcclausspoyea
authored
Add wildcard pattern matching using dynamic programming (TheAlgorithms#5334)
* Added regular expression implimentation using dp * replaced input() with example values * Apply suggestions from code review Co-authored-by: Christian Clauss <[email protected]> * changed returning value to bool and added test cases * added doctest Co-authored-by: John Law <[email protected]> * added test cases * Apply suggestions from code review Co-authored-by: John Law <[email protected]> * shifted to strings * Changed filename * Update function name to match_pattern Co-authored-by: John Law <[email protected]> * Update function name to match_pattern Co-authored-by: John Law <[email protected]> Co-authored-by: Christian Clauss <[email protected]> Co-authored-by: John Law <[email protected]>
1 parent 2e2e1b6 commit 83cf578

File tree

1 file changed

+112
-0
lines changed

1 file changed

+112
-0
lines changed

strings/wildcard_pattern_matching.py

+112
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,112 @@
1+
"""
2+
Implementation of regular expression matching with support for '.' and '*'.
3+
'.' Matches any single character.
4+
'*' Matches zero or more of the preceding element.
5+
The matching should cover the entire input string (not partial).
6+
7+
"""
8+
9+
10+
def match_pattern(input_string: str, pattern: str) -> bool:
11+
"""
12+
uses bottom-up dynamic programming solution for matching the input
13+
string with a given pattern.
14+
15+
Runtime: O(len(input_string)*len(pattern))
16+
17+
Arguments
18+
--------
19+
input_string: str, any string which should be compared with the pattern
20+
pattern: str, the string that represents a pattern and may contain
21+
'.' for single character matches and '*' for zero or more of preceding character
22+
matches
23+
24+
Note
25+
----
26+
the pattern cannot start with a '*',
27+
because there should be at least one character before *
28+
29+
Returns
30+
-------
31+
A Boolean denoting whether the given string follows the pattern
32+
33+
Examples
34+
-------
35+
>>> match_pattern("aab", "c*a*b")
36+
True
37+
>>> match_pattern("dabc", "*abc")
38+
False
39+
>>> match_pattern("aaa", "aa")
40+
False
41+
>>> match_pattern("aaa", "a.a")
42+
True
43+
>>> match_pattern("aaab", "aa*")
44+
False
45+
>>> match_pattern("aaab", ".*")
46+
True
47+
>>> match_pattern("a", "bbbb")
48+
False
49+
>>> match_pattern("", "bbbb")
50+
False
51+
>>> match_pattern("a", "")
52+
False
53+
>>> match_pattern("", "")
54+
True
55+
"""
56+
57+
len_string = len(input_string) + 1
58+
len_pattern = len(pattern) + 1
59+
60+
# dp is a 2d matrix where dp[i][j] denotes whether prefix string of
61+
# length i of input_string matches with prefix string of length j of
62+
# given pattern.
63+
# "dp" stands for dynamic programming.
64+
dp = [[0 for i in range(len_pattern)] for j in range(len_string)]
65+
66+
# since string of zero length match pattern of zero length
67+
dp[0][0] = 1
68+
69+
# since pattern of zero length will never match with string of non-zero length
70+
for i in range(1, len_string):
71+
dp[i][0] = 0
72+
73+
# since string of zero length will match with pattern where there
74+
# is at least one * alternatively
75+
for j in range(1, len_pattern):
76+
dp[0][j] = dp[0][j - 2] if pattern[j - 1] == "*" else 0
77+
78+
# now using bottom-up approach to find for all remaining lengths
79+
for i in range(1, len_string):
80+
for j in range(1, len_pattern):
81+
if input_string[i - 1] == pattern[j - 1] or pattern[j - 1] == ".":
82+
dp[i][j] = dp[i - 1][j - 1]
83+
84+
elif pattern[j - 1] == "*":
85+
if dp[i][j - 2] == 1:
86+
dp[i][j] = 1
87+
elif pattern[j - 2] in (input_string[i - 1], "."):
88+
dp[i][j] = dp[i - 1][j]
89+
else:
90+
dp[i][j] = 0
91+
else:
92+
dp[i][j] = 0
93+
94+
return bool(dp[-1][-1])
95+
96+
97+
if __name__ == "__main__":
98+
import doctest
99+
100+
doctest.testmod()
101+
# inputing the strings
102+
# input_string = input("input a string :")
103+
# pattern = input("input a pattern :")
104+
105+
input_string = "aab"
106+
pattern = "c*a*b"
107+
108+
# using function to check whether given string matches the given pattern
109+
if match_pattern(input_string, pattern):
110+
print(f"{input_string} matches the given pattern {pattern}")
111+
else:
112+
print(f"{input_string} does not match with the given pattern {pattern}")

0 commit comments

Comments
 (0)