-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrabinkarp.py
56 lines (45 loc) · 1.64 KB
/
rabinkarp.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
'''
rabinkarp.py - Rabin-Karp algorithm for substring search.
Written by Sergey Torshin @torshin5ergey
'''
def rabin_karp(string: str, substring: str) -> int:
    """
    Find the first occurrence of a pattern with the Rabin-Karp algorithm.

    A rolling polynomial hash of every window of ``len(substring)``
    characters in ``string`` is compared with the hash of ``substring``.
    When the hashes agree the window is compared with the pattern directly,
    so a hash collision can never produce a false match.

    Args:
        string (str) -- string to search for a pattern in it
        substring (str) -- pattern string to find

    Returns:
        int -- index of the first occurrence of the substring in the string,
        or -1 if not found. An empty substring matches at index 0.
    """
    n = len(string)
    m = len(substring)
    if m > n:
        return -1
    if m == 0:
        # The empty pattern matches at the very start; returning here also
        # keeps the exponent m - 1 below non-negative.
        return 0

    # Prime modulus (big prime number) to minimize collisions
    q = 1000000007  # Commonly used number
    # Radix of the polynomial hash (256 covers single-byte character codes)
    d = 256
    # Weight of the window's leading character: d**(m-1) mod q.
    # Computed once with three-argument pow so the value stays below q
    # instead of rebuilding a huge integer d**(m-1) on every slide.
    leading_weight = pow(d, m - 1, q)

    # Hash the pattern and the first window of the text (Horner's scheme).
    hash_substring = 0
    hash_string = 0
    for pattern_char, text_char in zip(substring, string):
        hash_substring = (hash_substring * d + ord(pattern_char)) % q
        hash_string = (hash_string * d + ord(text_char)) % q

    # Check and slide the pattern window across the text.
    last_start = n - m
    for i in range(last_start + 1):
        # Equal hashes are only a hint; confirm with a real comparison.
        if hash_string == hash_substring and string[i:i + m] == substring:
            return i
        if i < last_start:
            # Drop string[i] from the front, shift by one digit and append
            # string[i + m]. Python's % always yields a non-negative result,
            # so the intermediate negative value is harmless.
            hash_string = (
                d * (hash_string - ord(string[i]) * leading_weight)
                + ord(string[i + m])
            ) % q
    return -1  # Not found
def main():
    """Read a text and a pattern from standard input and print the match index."""
    haystack = input("Enter a string:\n")
    needle = input("Enter a substring:\n")
    position = rabin_karp(haystack, needle)
    print(position)
# Run the interactive prompt only when this file is executed as a script,
# so importing the module for rabin_karp() does not block on input().
if __name__ == "__main__":
    main()