aboutsummaryrefslogtreecommitdiff
path: root/ass1/binary_boyermoore.py
diff options
context:
space:
mode:
Diffstat (limited to 'ass1/binary_boyermoore.py')
-rw-r--r--ass1/binary_boyermoore.py80
1 files changed, 24 insertions, 56 deletions
diff --git a/ass1/binary_boyermoore.py b/ass1/binary_boyermoore.py
index a4d286d..f226f6b 100644
--- a/ass1/binary_boyermoore.py
+++ b/ass1/binary_boyermoore.py
@@ -98,69 +98,37 @@ def boyer_moore(pat, txt):
comps = 0
print("="*15)
- print(6*" " + txt)
+ # print(6*" " + txt)
+ i = m-1
while j <= n-m:
- matches = 0
- for i in range(m-1, -1, -1):
- # if galil_index == j and start <= i < stop:
- # print("pee")
- # i = max(start + 1, 1)
- # continue
-
- print(f"{j=:02} {' ' * j}", end="")
- for x in range(len(pat)):
- if x == i:
- print(pat[x].upper(), end="")
- else:
- print(pat[x], end="")
- print()
- match = pat[i] == txt[j+i]
- comps += 1
- if match:
- matches += 1
- if matches == m:
- good_suffix_shift = m - matched_prefix[1]
- j += good_suffix_shift
- i = m-1
- occurrence += 1
- break
- else:
- mismatched = txt[j+i]
- # bad_char_shift = i-R[alpha_number(mismatched)][i]
-
- good_suffix_shift = 1
- if good_suffix[i+1] > 0:
- good_suffix_shift = m - good_suffix[i+1]
- start = good_suffix[i+1] - m + i
- stop = good_suffix[i+1]
- next_galil = j+1
- elif good_suffix[i+1] == 0:
- good_suffix_shift = m - matched_prefix[i+1]
- start = 1
- stop = matched_prefix[i+1]
- next_galil = j+1
- elif matches == m:
- print(f"Match at {j}")
- good_suffix_shift = m - matched_prefix[1]
- # assert good_suffix[i+1] != 0
- # print(start, stop)
+ match = pat[i] == txt[j+i]
+ comps += 1
+ if match:
+ if i == 0:
+ good_suffix_shift = m - matched_prefix[1]
j += good_suffix_shift
- # print(good_suffix_shift, bad_char_shift)
- # if good_suffix_shift >= bad_char_shift:
- # print("good suff", good_suffix_shift)
- # else:
- # print("bad char", bad_char_shift)
- # print(i)
- # if good_suffix[i+1] >= 0 and good_suffix_shift >= bad_char_shift:
- # galil_index = j
- break
+ occurrence += 1
+ i = m-1
+ else:
+ i -= 1
+ else:
+ good_suffix_shift = 1
+ if good_suffix[i+1] > 0:
+ good_suffix_shift = m - good_suffix[i+1]
+ elif good_suffix[i+1] == 0:
+ good_suffix_shift = m - matched_prefix[i+1]
+ j += good_suffix_shift
+ i = m-1
print(f"It found {occurrence} occurences.")
- print(f"\n {list(range(m))}")
+ # print(f"\n {list(range(m))}")
+ print("" + str(list(map(int, pat))))
# for i, a in enumerate(R):
# print(chr(i+97), a)
print(good_suffix)
+ print(matched_prefix)
print(f"{comps} comparisons.")
-boyer_moore("010010", "101010111010010101110111010101110100101011101101111011111111111101110111010101110100101011101101101110111010101110100101011101101101110110000110101011101001010111011011011101100001010101110100101011101110101011101001010111011011011101110101011101001010111011011011101110101011101001010111011011011101100001101010111010010101110110110111011000010111011111011101110110101110110101101100000001011001010101010101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010100001011101111101110111011010111011010110110000000101100101010101010101011101001010111011011011101100001011101111101110111011010101110100101011101101101110110000101110111110101010111010010101110110110111011000010111011101010111010010101110110110111011000010111010101110100101011101101101010101110100101011101101101110110000101110111110111011101101011101101011011000000010110010101010101111011000010111011111011101110110101110110101101100000001011001010101010110111110111011101101011101101011011000000010110010101010101111011101110110101110110101101100000001011001010101010111101110110101110110101101100000001011001010101010110101110110101101100000001011001010101010110110111011000010101011101001010111011101010111010010101110110110111011101010111010010101110110110111011101010111010010101110110110111011000011010101110100101011101101101110110000101110111110111011101101011101101011011000000010110010101010101011101111101110111011010111011010110110000000101100101010101010000101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010101010111010010101110110110111011000010111011111011101110110101011101001010111011011011101100001011101111101010101110100101011101101101110110000101110111010101110100101011101101101110110000101110101011101001010111011011010101011101001010111011011011101100001011101111101110111011010111011010110110000000101100101010101011110110000101110111110111011101101011101101011011000000010110010101010101101111101110111011010111011010110110000000101100101010101011110111011101101011101101011011000000010110010101010101111011101101011101101011011000000010110010101010101101011101101011011000000010110010101010101101101110110000101110111110111011101101011101101011011000000010110010101010101101110111110111011101101011101101011011000000010110010101010101101110111110111011101101011101101011011000000010110010101010101011101111101110111011010111011010110110000000101100101010101010000101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010101010111101111111111111010010101110110110111011000010111011111011101110110101011101001010111011011011101100001011101111101010101110100101011101101101110110000101110111010101110100101011101101101110110000101110101011101001010111011011010101011101001010111011011011101100001011101111101110111011010111011010110110000000101100101010101011110110000101110111110111011101101011101101011011000000010110010101010101101111101110111011010111011010110110000000101100101010101011110111011101101011101101011011000000010110010101010101111011101101011101101011011000000010110010101010101101011101101011011000000010110010101010101101101110110000101110111110111011101101011101101011011000000010110010101010101") \ No newline at end of file
+boyer_moore("111000110", "01110111010101110100101011101101111011111111111111100011001110111010101110100101011101101101110111010110111010010101110110110111011111011011")
+# boyer_moore("111011011001110", "101010111010010101110111010101110100101011101101111011111111111101110111010101110100101011101101101110111010101110100101011101101101110111110110110011100000110101011101001010111011011011101100001010101110100101011101110101011101001010111011011011101110101011101001010111011011011101110101011101001010111011011011101100001101010111010010101110110110111011000010111011111011101110110101110110101101100000001011001010101010101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010100001011101111101110111011010111011010110110000000101100101010101010101011101001010111011011011101100001011101111101110111011010101110100101011101101101110110000101110111110101010111010010101110110110111011000010111011101010111010010101110110110111011000010111010101110100101011101101101010101110100101011101101101110110000101110111110111011101101011101101011011000000010110010101010101111011000010111011111011101110110101110110101101100000001011001010101010110111110111011101101011101101011011000000010110010101010101111011101110110101110110101101100000001011001010101010111101110110101110110101101100000001011001010101010110101110110101101100000001011001010101010110110111011000010101011101001010111011101010111010010101110110110111011101010111010010101110110110111011101010111010010101110110110111011000011010101110100101011101101101110110000101110111110111011101101011101101011011000000010110010101010101011101111101110111011010111011010110110000000101100101010101010000101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010101010111010010101110110110111011000010111011111011101110110101011101001010111011011011101100001011101111101010101110100101011101101101110110000101110111010101110100101011101101101110110000101110101011101001010111011011010101011101001010111011011011101100001011101111101110111011010111011010110110000000101100101010101011110110000101110111110111011101101011101101011011000000010110010101010101101111101110111011010111011010110110000000101100101010101011110111011101101011101101011011000000010110010101010101111011101101011101101011011000000010110010101010101101011101101011011000000010110010101010101101101110110000101110111110111011101101011101101011011000000010110010101010101101110111110111011101101011101101011011000000010110010101010101101110111110111011101101011101101011011000000010110010101010101011101111101110111011010111011010110110000000101100101010101010000101110111110111011101101011101101011011000000010110010101010101000010111011111011101110110101110110101101100000001011001010101010101010111101111111111111010010101110110110111011000010111011111011101110110101011101001010111011011011101100001011101111101010101110100101011101101101110110000101110111010101110100101011101101101110110000101110101011101001010111011011010101011101001010111011011011101100001011101111101110111011010111011010110110000000101100101010101011110110000101110111110111011101101011101101011011000000010110010101010101101111101110111011010111011010110110000000101100101010101011110111011101101011101101011011000000010110010101010101111011101101011101101011011000000010110010101010101101011101101011011000000010110010101010101101101110110000101110111110111011101101011101101011011000000010110010101010101") \ No newline at end of file