Init (add codebase)

2021-11-14 14:35:05 +01:00 · 2021-11-14 14:35:05 +01:00 · bacd7cff71
commit bacd7cff71
parent d10424819c
43 changed files with 174555 additions and 2 deletions
--- a/48
+++ b/48
@ -0,0 +1,48 @@
 CC = cc # C compiler
 # cc and gcc are the same
 CXX = c++ # C++ compiler
 # Alternatives:
 # c++
 # g++
 # clang++
 CPPFLAGS = # preprocessor flags
 CFLAGS = -Wall -Wfloat-equal -std=c99 -O0 -mtune=native -funroll-loops $(OPT) # C compiler flags
 # -Wall: Enable the common set of warnings
 # -Wfloat-equal: Warn if comparing floats with ==
 # -OX: Optimization level -O0 (none, default), -O1, -O2, -O3 (most, may increase file size), -Os (decrease file size), -ffast-math
 # -mtune: Tune for specific/generic CPU
 # -funroll-loops: Unroll loops when compiling
 # -fopenmp: Enable OpenMP (When running, set the environment variable OMP_NUM_THREADS)
 # $(OPT): Passes any parameter given when calling make with 'make OPT=...'
 CXXFLAGS = -Wall -std=c++20 -O0 # C++ compiler flags
 LDFLAGS = # linker flags
 LDLIBS = # library flags
 # -lm (for <math.h>)
 # -lblas (BASIC LINEAR ALGEBRA SUBPROGRAMS)
 # -lcblas (for <cblas.h>)
 # -lopenblas (NOT INSTALLED; blas and cblas in one; conflicts with blas and cblas)
 # -llapack (LAPACK)
 # -llapacke (LAPACKE) NOTE: The order of "-llapacke -llapack -lblas" is very important
 #LINK.o = $(CXX) $(LDFLAGS) # use CXX for linking
 # Link the string-matching executable from its three object files
 simple_string_matching: simple_string_matching.o Rabin_fingerprint.o general_library.o
 	$(CXX) $(CXXFLAGS) simple_string_matching.o Rabin_fingerprint.o general_library.o -o simple_string_matching
 # NOTE(review): no header prerequisites are listed here; if simple_string_matching.cpp
 # includes Rabin_fingerprint.hpp / general_library.hpp, header edits will not trigger a rebuild
 simple_string_matching.o: simple_string_matching.cpp
 	$(CXX) $(CXXFLAGS) -c simple_string_matching.cpp
 Rabin_fingerprint.o: Rabin_fingerprint.cpp Rabin_fingerprint.hpp
 	$(CXX) $(CXXFLAGS) -c Rabin_fingerprint.cpp
 general_library.o: general_library.cpp general_library.hpp
 	$(CXX) $(CXXFLAGS) -c general_library.cpp
 # No recipe is given for porat-porat, so it is built by make's built-in rule for a .cpp source
 porat-porat: porat-porat.cpp
 # Tell make that 'clean' isn't referring to a file
 .PHONY: clean
 # A make target that cleans (by deleting the built executables and object files)
 clean:
 	$(RM) porat-porat
 	$(RM) simple_string_matching
 	$(RM) *.o
--- a/README.md
+++ b/README.md
@ -1,3 +1,33 @@
-# Bachelors_Thesis_Code
+# Bachelor's_Thesis_Code
 Code used for my Bachelor's Thesis
 # Versions
 ## Current Version
 Compared to V1, the files `generate_initial_irreducible_polynomials.sage`, `generate_random_irreducible_polynomial.sage`, and `multiply_polynomials_modulo_polynomial.sage` have been removed from the main folder in the current version, as they have already been used for implementing their corresponding features in `general_library.cpp`. They are preserved in the V1 folder.  
 This version also contains code relating to Porat-Porat and other random code stumps. This code is going to be completely reimplemented, but is preserved for now to avoid redoing work.  
 ## V1
 #### `general_library.cpp`
 - Exports functions for:  
    - Generating a random irreducible polynomial of degree up to 31.  
 - Contains code for:  
    - Contains code to multiply polynomials modulo another polynomial.  
    - Doesn't contain code to initially calculate modulo a polynomial. It requires the initial polynomials to all be at most of the same degree as the polynomial that you use for modulo.  
    - A very custom version of calculating Reduced Row Echelon Form assuming all values are in Z2.  
 #### `generate_initial_irreducible_polynomials.sage`
 - Generates a list of irreducible polynomials, one of each degree. The polynomials are printed in a format that can be copy-pasted directly into `general_library.cpp`.  
 #### `generate_random_irreducible_polynomial.sage`
 - Contains a general template of how `general_library.cpp` should implement generating a random irreducible polynomial. The output of this program can also be used for debugging, since it uses many (correctly implemented) built-in SageMath functions that have to be implemented manually in `general_library.cpp`.  
 #### `multiply_polynomials_modulo_polynomial.sage`
 - Contains a general template of how `general_library.cpp` should implement multiplying polynomials modulo a polynomial in Z2.  
 #### `compare_fingerprint_false_positive_probabilities.sage`
 - Contains initial (i.e. very rough) code which compares the upper bounds on the probability of a false match occurring for the Rabin fingerprint and for the fingerprint used in Karp-Rabin.  
 #### `test_rabin_fingerprint.sage`
 - Contains initial (i.e. very rough) code which debunks my theory that modulo a prime is somewhat equivalent to modulo an irreducible polynomial.  
--- a/Rabin_fingerprint.cpp
+++ b/Rabin_fingerprint.cpp
@ -0,0 +1,73 @@
 #include "Rabin_fingerprint.hpp"
 Rabin_fingerprint::Rabin_fingerprint(uint32_t p, size_t window_size_in_bits) {
    // The modulo polynomial must be stored first: the shift polynomial is
    // computed by reducing with it.
    this->set_modulo_polynomial(p);
    this->set_shift_polynomial(window_size_in_bits);
 }
 // Stores the modulo polynomial with bit 31 (the x^31 term) masked off, so
 // only the coefficients of x^0..x^30 are kept.
 void Rabin_fingerprint::set_modulo_polynomial (uint32_t p) {
    // Integer mask instead of the floating-point pow(2, 31): same value,
    // computed at compile time.
    constexpr uint32_t low_31_bits = (uint32_t{1} << 31) - 1;
    polynomial = p & low_31_bits;
 }
 // Computes the value that shift_bit XORs into the fingerprint to cancel a
 // bit leaving the window: the single bit 1 shifted left window_size_in_bits
 // times, reduced with the modulo polynomial along the way.
 // Throws std::logic_error (debug builds only) if the modulo polynomial is 0.
 void Rabin_fingerprint::set_shift_polynomial (size_t window_size_in_bits) {
    #ifndef NDEBUG
    if (polynomial == 0)
        throw std::logic_error("Call set_modulo_polynomial first, as this function depends on the polynomial variable being set.");
    #endif
    // Hoisted integer constant; replaces a pow(2, 31) call on every iteration.
    constexpr uint32_t overflow_bit = uint32_t{1} << 31;
    shift_polynomial = 1;
    // NOTE: We shift the bit 1 space too long, since we are removing the bit that has been pushed outside the window
    for (size_t i = 0; i < window_size_in_bits; i++) {
        shift_polynomial <<= 1;
        // The stored polynomial has bit 31 masked off, so this XOR leaves bit 31
        // set; the next left shift drops it. push_bit behaves the same way.
        if ((shift_polynomial & overflow_bit) != 0)
            shift_polynomial ^= polynomial;
    }
 }
 // Pushes the 8 bits of c into the fingerprint, most significant bit first.
 void Rabin_fingerprint::push_char (char c) {
    const unsigned char byte = static_cast<unsigned char>(c);
    // The counter is an int: with a plain `char` counter the condition
    // `i >= 0` is always true on platforms where char is unsigned.
    for (int i = 7; i >= 0; i--) {
        push_bit(((byte >> i) & 1u) != 0);
    }
 }
 // Appends one bit at the low end of the fingerprint and reduces with the
 // modulo polynomial when the shift carried a 1 into bit 31.
 void Rabin_fingerprint::push_bit (bool b) {
    // Integer constant instead of pow(2, 31): this runs once per input bit.
    constexpr uint32_t overflow_bit = uint32_t{1} << 31;
    fingerprint <<= 1;
    fingerprint |= b;
    // The stored polynomial has bit 31 masked off (see set_modulo_polynomial),
    // so bit 31 stays set after the XOR and is dropped by the next shift.
    // This is kept as-is: set_shift_polynomial follows the same convention.
    if ((fingerprint & overflow_bit) != 0)
        fingerprint ^= polynomial;
 }
 // Cancels a bit that has left the window: when b is set, the precomputed
 // shift polynomial is XORed into the fingerprint; a cleared bit is a no-op.
 void Rabin_fingerprint::shift_bit (bool b) {
    #ifndef NDEBUG
    if (shift_polynomial == 0)
        throw std::logic_error("Call set_shift_polynomial first, as this function depends on the shift_polynomial variable being set.");
    #endif
    if (!b)
        return;
    fingerprint ^= shift_polynomial;
 }
 // Slides the window by one character: for each of the 8 bit positions, most
 // significant first, pushes the bit of c_in and removes the bit of c_out.
 void Rabin_fingerprint::slide_char (char c_in, char c_out) {
    const unsigned char byte_in = static_cast<unsigned char>(c_in);
    const unsigned char byte_out = static_cast<unsigned char>(c_out);
    // The counter is an int: with a plain `char` counter the condition
    // `i >= 0` is always true on platforms where char is unsigned.
    for (int i = 7; i >= 0; i--) {
        slide_bit(((byte_in >> i) & 1u) != 0, ((byte_out >> i) & 1u) != 0);
    }
 }
 /* #include <iostream> */
 void Rabin_fingerprint::slide_bit (bool b_in, bool b_out) {
    /* std::cout << "bitset b(c):  " << b << std::endl; */
        /* std::cout << "push bit " << b[i] << std::endl; */
    /* std::cout << "push bit " << b_in << std::endl; */
    push_bit(b_in);
    /* std::cout << "shift bit " << b_out << std::endl; */
    shift_bit(b_out);
 }
 uint32_t Rabin_fingerprint::get_fingerprint () {
    return fingerprint;
 }
--- a/Rabin_fingerprint.hpp
+++ b/Rabin_fingerprint.hpp
@ -0,0 +1,30 @@
 #ifndef RABIN_FINGERPRINT_H
 #define RABIN_FINGERPRINT_H
 #include <stdint.h>
 #include <bitset>
 #include <math.h>
 #include <stdexcept>
 // Rolling fingerprint over a bit window: bits are pushed in at the low end
 // and reduced with a modulo polynomial over Z2.
 class Rabin_fingerprint {
    public:
        // polynomial: modulo polynomial, bit i being the coefficient of x^i
        //             (only bits 0..30 are stored).
        // window_size_in_bits: number of bits covered by the sliding window.
        Rabin_fingerprint(uint32_t polynomial, size_t window_size_in_bits);
        // Push the 8 bits of c, most significant bit first.
        void push_char (char c);
        // Push a single bit into the fingerprint.
        void push_bit (bool b);
        // Cancel a bit that has left the window (no-op when b is false).
        void shift_bit (bool b);
        // Push c_in and remove c_out, bit by bit.
        void slide_char (char c_in, char c_out);
        // Push b_in, then remove b_out (names match the definition).
        void slide_bit (bool b_in, bool b_out);
        // Current fingerprint value.
        uint32_t get_fingerprint();
    private:
        void set_modulo_polynomial (uint32_t p);
        // Must be called after set_modulo_polynomial.
        void set_shift_polynomial (size_t window_size_in_bits);
        uint32_t fingerprint = 0;
        uint32_t polynomial = 0;
        uint32_t shift_polynomial = 0;
 };
 #endif
--- a/V1/Makefile
+++ b/V1/Makefile
@ -0,0 +1,46 @@
 CC = cc # C compiler
 # cc and gcc are the same
 CXX = c++ # C++ compiler
 # Alternatives:
 # c++
 # g++
 # clang++
 CPPFLAGS = # preprocessor flags
 CFLAGS = -Wall -Wfloat-equal -std=c99 -O0 -mtune=native -funroll-loops $(OPT) # C compiler flags
 # -Wall: Enable the common set of warnings
 # -Wfloat-equal: Warn if comparing floats with ==
 # -OX: Optimization level -O0 (none, default), -O1, -O2, -O3 (most, may increase file size), -Os (decrease file size), -ffast-math
 # -mtune: Tune for specific/generic CPU
 # -funroll-loops: Unroll loops when compiling
 # -fopenmp: Enable OpenMP (When running, set the environment variable OMP_NUM_THREADS)
 # $(OPT): Passes any parameter given when calling make with 'make OPT=...'
 CXXFLAGS = -Wall -std=c++20 -O0 # C++ compiler flags
 LDFLAGS = # linker flags
 LDLIBS = # library flags
 # -lm (for <math.h>)
 # -lblas (BASIC LINEAR ALGEBRA SUBPROGRAMS)
 # -lcblas (for <cblas.h>)
 # -lopenblas (NOT INSTALLED; blas and cblas in one; conflicts with blas and cblas)
 # -llapack (LAPACK)
 # -llapacke (LAPACKE) NOTE: The order of "-llapacke -llapack -lblas" is very important
 #LINK.o = $(CXX) $(LDFLAGS) # use CXX for linking
 # Link the string-matching executable from its object files.
 # $^ = all prerequisites, $@ = the target; LDFLAGS/LDLIBS are honoured when set.
 simple_string_matching: simple_string_matching.o Rabin_fingerprint.o general_library.o
 	$(CXX) $(CXXFLAGS) $(LDFLAGS) $^ $(LDLIBS) -o $@
 # simple_string_matching.cpp includes both project headers, so they are listed
 # as prerequisites to force a rebuild when either header changes.
 simple_string_matching.o: simple_string_matching.cpp Rabin_fingerprint.hpp general_library.hpp
 	$(CXX) $(CPPFLAGS) $(CXXFLAGS) -c $< -o $@
 Rabin_fingerprint.o: Rabin_fingerprint.cpp Rabin_fingerprint.hpp
 	$(CXX) $(CPPFLAGS) $(CXXFLAGS) -c $< -o $@
 general_library.o: general_library.cpp general_library.hpp
 	$(CXX) $(CPPFLAGS) $(CXXFLAGS) -c $< -o $@
 # Tell make that 'clean' isn't referring to a file
 .PHONY: clean
 # A make target that cleans (by deleting the built executable and object files)
 clean:
 	$(RM) simple_string_matching
 	$(RM) *.o
--- a/V1/Rabin_fingerprint.cpp
+++ b/V1/Rabin_fingerprint.cpp
@ -0,0 +1,68 @@
 #include "Rabin_fingerprint.hpp"
 Rabin_fingerprint::Rabin_fingerprint(uint32_t p, size_t window_size_in_bits) {
    // The modulo polynomial must be stored first: the shift polynomial is
    // computed by reducing with it.
    this->set_modulo_polynomial(p);
    this->set_shift_polynomial(window_size_in_bits);
 }
 // Stores the modulo polynomial with bit 31 (the x^31 term) masked off, so
 // only the coefficients of x^0..x^30 are kept.
 void Rabin_fingerprint::set_modulo_polynomial (uint32_t p) {
    // Integer mask instead of the floating-point pow(2, 31): same value,
    // computed at compile time.
    constexpr uint32_t low_31_bits = (uint32_t{1} << 31) - 1;
    polynomial = p & low_31_bits;
 }
 // Computes the value that shift_bit XORs into the fingerprint to cancel a
 // bit leaving the window: the single bit 1 shifted left window_size_in_bits
 // times, reduced with the modulo polynomial along the way.
 // Throws std::logic_error (debug builds only) if the modulo polynomial is 0.
 void Rabin_fingerprint::set_shift_polynomial (size_t window_size_in_bits) {
    #ifndef NDEBUG
    if (polynomial == 0)
        throw std::logic_error("Call set_modulo_polynomial first, as this function depends on the polynomial variable being set.");
    #endif
    // Hoisted integer constant; replaces a pow(2, 31) call on every iteration.
    constexpr uint32_t overflow_bit = uint32_t{1} << 31;
    shift_polynomial = 1;
    // NOTE: We shift the bit 1 space too long, since we are removing the bit that has been pushed outside the window
    for (size_t i = 0; i < window_size_in_bits; i++) {
        shift_polynomial <<= 1;
        // The stored polynomial has bit 31 masked off, so this XOR leaves bit 31
        // set; the next left shift drops it. push_bit behaves the same way.
        if ((shift_polynomial & overflow_bit) != 0)
            shift_polynomial ^= polynomial;
    }
 }
 // Pushes the 8 bits of c into the fingerprint, most significant bit first.
 void Rabin_fingerprint::push_char (char c) {
    const unsigned char byte = static_cast<unsigned char>(c);
    // The counter is an int: with a plain `char` counter the condition
    // `i >= 0` is always true on platforms where char is unsigned.
    for (int i = 7; i >= 0; i--) {
        push_bit(((byte >> i) & 1u) != 0);
    }
 }
 // Appends one bit at the low end of the fingerprint and reduces with the
 // modulo polynomial when the shift carried a 1 into bit 31.
 void Rabin_fingerprint::push_bit (bool b) {
    // Integer constant instead of pow(2, 31): this runs once per input bit.
    constexpr uint32_t overflow_bit = uint32_t{1} << 31;
    fingerprint <<= 1;
    fingerprint |= b;
    // The stored polynomial has bit 31 masked off (see set_modulo_polynomial),
    // so bit 31 stays set after the XOR and is dropped by the next shift.
    // This is kept as-is: set_shift_polynomial follows the same convention.
    if ((fingerprint & overflow_bit) != 0)
        fingerprint ^= polynomial;
 }
 // Cancels a bit that has left the window: when b is set, the precomputed
 // shift polynomial is XORed into the fingerprint; a cleared bit is a no-op.
 void Rabin_fingerprint::shift_bit (bool b) {
    #ifndef NDEBUG
    if (shift_polynomial == 0)
        throw std::logic_error("Call set_shift_polynomial first, as this function depends on the shift_polynomial variable being set.");
    #endif
    if (!b)
        return;
    fingerprint ^= shift_polynomial;
 }
 // Slides the window by one character: for each of the 8 bit positions, most
 // significant first, pushes the bit of c_in and removes the bit of c_out.
 void Rabin_fingerprint::slide_char (char c_in, char c_out) {
    const unsigned char byte_in = static_cast<unsigned char>(c_in);
    const unsigned char byte_out = static_cast<unsigned char>(c_out);
    // The counter is an int: with a plain `char` counter the condition
    // `i >= 0` is always true on platforms where char is unsigned.
    for (int i = 7; i >= 0; i--) {
        slide_bit(((byte_in >> i) & 1u) != 0, ((byte_out >> i) & 1u) != 0);
    }
 }
 void Rabin_fingerprint::slide_bit (bool b_in, bool b_out) {
    push_bit(b_in);
    shift_bit(b_out);
 }
 uint32_t Rabin_fingerprint::get_fingerprint () {
    return fingerprint;
 }
--- a/V1/Rabin_fingerprint.hpp
+++ b/V1/Rabin_fingerprint.hpp
@ -0,0 +1,30 @@
 #ifndef RABIN_FINGERPRINT_H
 #define RABIN_FINGERPRINT_H
 #include <stdint.h>
 #include <bitset>
 #include <math.h>
 #include <stdexcept>
 // Rolling fingerprint over a bit window: bits are pushed in at the low end
 // and reduced with a modulo polynomial over Z2.
 class Rabin_fingerprint {
    public:
        // polynomial: modulo polynomial, bit i being the coefficient of x^i
        //             (only bits 0..30 are stored).
        // window_size_in_bits: number of bits covered by the sliding window.
        Rabin_fingerprint(uint32_t polynomial, size_t window_size_in_bits);
        // Push the 8 bits of c, most significant bit first.
        void push_char (char c);
        // Push a single bit into the fingerprint.
        void push_bit (bool b);
        // Cancel a bit that has left the window (no-op when b is false).
        void shift_bit (bool b);
        // Push c_in and remove c_out, bit by bit.
        void slide_char (char c_in, char c_out);
        // Push b_in, then remove b_out (names match the definition).
        void slide_bit (bool b_in, bool b_out);
        // Current fingerprint value.
        uint32_t get_fingerprint();
    private:
        void set_modulo_polynomial (uint32_t p);
        // Must be called after set_modulo_polynomial.
        void set_shift_polynomial (size_t window_size_in_bits);
        uint32_t fingerprint = 0;
        uint32_t polynomial = 0;
        uint32_t shift_polynomial = 0;
 };
 #endif
--- a/V1/compare_fingerprint_false_positive_probabilities.sage
+++ b/V1/compare_fingerprint_false_positive_probabilities.sage
@ -0,0 +1,73 @@
 # Bounds compared by this script:
 # Rabin fingerprint: k > lg(n*m/e), e is the upper bound on the error probability
 # Karp-Rabin fingerprint: <= pi(n(n-m+1))/pi(M)
 # 32-bit
 # M is the bound used in pi(M); k is the exponent used in n*m/(2**k) below
 M = 2**32-1
 k = 31
 # 16-bit (alternative configuration, disabled)
 # M = 2**16-1
 # k = 13
 # Searches for the index i at which Primes().unrank(i) equals the first prime
 # after a, and returns that index (per the comment at the return statement,
 # this is the value searched for because indices count from 0).
 # The search moves i up or down by `jump`; `jump` is doubled while the search
 # keeps going in one direction and halved otherwise, with `lastdirection`
 # tracking the recent directions.
 # NOTE(review): Sage's built-in prime_pi(a) presumably computes the same value - confirm.
 # NOTE(review): `jump //= 2` turns a jump of 1 into 0, after which i no longer
 # moves; termination for every input has not been verified.
 def fpi(a):
    p = Primes()
    a_next = p.next(a)
    i = 0
    jump = 1
    lastdirection = -2
    while(True):
        # Progress indicator: overwrite the current jump size on one line
        print(f'{jump:010d}', end='\r')
        # print(f'{i}, {jump}')
        val = p.unrank(i)
        if val == a_next:
            return i # i-1, is the value we search for, but we count from 0, so i is correct
        elif val > a_next:
            # Overshot: move down
            if lastdirection == 2:
                # print('mul')
                lastdirection -= 1
                jump *= 2
            else:
                # print('div')
                jump //= 2
            lastdirection += 1
            # print(jump)
            i -= jump
        else:
            # Still below the target: move up
            if lastdirection == -2:
                # print('mul')
                lastdirection += 1
                jump *= 2
            else:
                # print('div')
                jump //= 2
            lastdirection -= 1
            i += jump
 # Rabin fingerprint: solve the bound for e
 # k = lg(n*m/e) <=>
 # 2^k = n*m/e <=>
 # 2^k/(n*m) = 1/e <=>
 # n*m/(2^k) = e
 # Karp-Rabin fingerprint
 # e = pi(n(n-m+1))/pi(M)
 # print(pi(2**32-1))
 # e_rabin = n*m/(2^k)
 # pi(M) does not depend on n or m, so it is computed once
 piM = fpi(M)
 # presumably m is the pattern length and n the text length - TODO confirm
 for m in [1, 10, 100, 1000, 10000, 100000, 1000000, 10000000]:
    for n in [10, 100, 1000, 10000, 100000, 1000000, 10000000, 100000000]:
        # Only combinations with m < n are evaluated
        if m>=n:
            continue
        print(f'(n, m) = ({n}, {m})')
        e_rabin = n*m/(2**k)
        print(f'Rabin: {float(e_rabin):.2e}')
        e_karpr = fpi(n*(n-m+1))/piM
        print(f'KarpR: {float(e_karpr):.2e}')
        print()
        print(f'{e_karpr} >= 1 is {e_karpr >= 1} | {e_rabin} >= 1 is {e_rabin >= 1}')
        # Once either bound reaches 1, stop increasing n for this m
        # (the break only leaves the inner loop)
        if float(e_karpr) >= 1 or float(e_rabin) >= 1:
            break
--- a/V1/general_library.cpp
+++ b/V1/general_library.cpp
@ -0,0 +1,184 @@
 #include "general_library.hpp"
 // SECTION: Functions related to calculating with polynomials in Z2[x]
 // One polynomial per degree 1..31, stored at index (degree - 1); this is how
 // get_random_irreducible_polynomial_in_Z2 looks up its starting polynomial.
 // Bit i of an entry is the coefficient of x^i.
 uint32_t irreducible_polynomials[] {
    0b11,                              // irreducible polynomial of degree 1
    0b111,                             // irreducible polynomial of degree 2
    0b1011,                            // irreducible polynomial of degree 3
    0b10011,                           // irreducible polynomial of degree 4
    0b100101,                          // irreducible polynomial of degree 5
    0b1011011,                         // irreducible polynomial of degree 6
    0b10000011,                        // irreducible polynomial of degree 7
    0b100011101,                       // irreducible polynomial of degree 8
    0b1000010001,                      // irreducible polynomial of degree 9
    0b10001101111,                     // irreducible polynomial of degree 10
    0b100000000101,                    // irreducible polynomial of degree 11
    0b1000011101011,                   // irreducible polynomial of degree 12
    0b10000000011011,                  // irreducible polynomial of degree 13
    0b100000010101001,                 // irreducible polynomial of degree 14
    0b1000000000110101,                // irreducible polynomial of degree 15
    0b10000000000101101,               // irreducible polynomial of degree 16
    0b100000000000001001,              // irreducible polynomial of degree 17
    0b1000001010000000011,             // irreducible polynomial of degree 18
    0b10000000000000100111,            // irreducible polynomial of degree 19
    0b100000000011011110011,           // irreducible polynomial of degree 20
    0b1000000000000001100101,          // irreducible polynomial of degree 21
    0b10000000001111101100001,         // irreducible polynomial of degree 22
    0b100000000000000000100001,        // irreducible polynomial of degree 23
    0b1000000011110011010101001,       // irreducible polynomial of degree 24
    0b10000000000000000101000101,      // irreducible polynomial of degree 25
    0b100000000000100010111010011,     // irreducible polynomial of degree 26
    0b1000000000000001011010101101,    // irreducible polynomial of degree 27
    0b10000000000000010000011100101,   // irreducible polynomial of degree 28
    0b100000000000000000000000000101,  // irreducible polynomial of degree 29
    0b1000000000000110010100010101111, // irreducible polynomial of degree 30
    0b10000000000000000000000000001001 // irreducible polynomial of degree 31
 };
 // Returns the degree of a polynomial over Z2, i.e. the index of its highest
 // set bit (bit i is the coefficient of x^i).
 // The zero polynomial is reported as degree 0, because __builtin_clz(0) is
 // undefined and must not be evaluated.
 size_t degree (uint32_t polynomial) {
    if (polynomial == 0)
        return 0;
    return 31 - static_cast<size_t>(__builtin_clz(polynomial));
 }
 // Multiplies q1 by q2 over Z2 and reduces the product modulo p.
 // Bit i of each argument is the coefficient of x^i.
 // q1 may be of at most the same degree as p; q2 is unrestricted.
 // Throws std::logic_error if p is zero or if q1 is of higher degree than p.
 uint32_t multiply_modulo_polynomials_in_Z2 (uint32_t q1, uint32_t q2, uint32_t p) {
    if (p == 0)
        throw std::logic_error("The modulo polynomial must be non-zero.");
    const size_t p_degree = degree(p);
    // degree() is only called on non-zero values; a zero q1 needs no reduction.
    if (q1 != 0) {
        const size_t q1_degree = degree(q1);
        if (q1_degree > p_degree)
            throw std::logic_error("We only support multiply-modulo whenever the multiplied polynomials are initially at most the same degree as the modulo polynomial.");
        if (q1_degree == p_degree)
            q1 ^= p;
    }
    const uint32_t p_top_bit = (uint32_t)1 << p_degree;
    // term holds q1 * x^i (mod p) for the bit i of q2 currently inspected, so
    // no array of precomputed shifts (previously a variable-length array) is needed.
    uint32_t term = q1;
    uint32_t sum = 0;
    for (uint32_t remaining = q2; remaining != 0; remaining >>= 1) {
        if ((remaining & 1u) != 0)
            sum ^= term;
        term <<= 1;
        // term was of lower degree than p before the shift, so it needs
        // reducing exactly when bit p_degree is now set.
        if ((term & p_top_bit) != 0)
            term ^= p;
    }
    return sum;
 }
 // Raises the polynomial q to the power exp over Z2, modulo p, by repeated
 // squaring. q may be of at most the same degree as p.
 // Returns 1 for exp == 0, and 0 when q is zero modulo p and exp > 0.
 uint32_t polynomial_power_in_Z2(uint32_t q, uint32_t exp, uint32_t p) {
    if (exp == 0)
        return 1;
    // degree() is only called on a non-zero q.
    if (q != 0 && degree(q) == degree(p))
        q ^= p;
    if (q == 0)
        return 0;
    // square holds q^(2^i) for the bit i of exp currently inspected. Walking
    // the bits of exp directly avoids the previous variable-length array and
    // its `i <= log2exp` bound, which indexed one bit past the bitset when
    // exp had bit 31 set.
    uint32_t square = q;
    uint32_t res = 1;
    while (true) {
        if ((exp & 1u) != 0)
            res = multiply_modulo_polynomials_in_Z2(res, square, p);
        exp >>= 1;
        if (exp == 0)
            break;
        square = multiply_modulo_polynomials_in_Z2(square, square, p);
    }
    return res;
 }
 // Brings the (m x n) matrix A over Z2 into reduced row echelon form, in place.
 // Row i is A[i]; column j is bit j of the row. Bits at positions >= n are
 // never modified within a row (whole rows may be swapped).
 // Throws std::logic_error if m > 31 or n > 32.
 void rref_Z2(std::vector<std::bitset<32>> &A, size_t m, size_t n) {
    if (m > 31 || n > 32)
        throw std::logic_error("We only support rref_Z2 for up to a (31x32)-matrix.");
    // Gauss-Jordan elimination: each pivot column is cleared in ALL other rows,
    // above and below. The previous separate back-substitution assumed that the
    // pivot of row i sits in column i, which fails for rank-deficient input.
    size_t pivot_row = 0;
    for (size_t col = 0; col < n && pivot_row < m; col++) {
        // Find the first row at or below pivot_row with a 1 in this column
        size_t found = pivot_row;
        while (found < m && !A[found][col])
            found++;
        if (found == m)
            continue; // No pivot in this column, pass to next column
        const std::bitset<32> tmp = A[found];
        A[found] = A[pivot_row];
        A[pivot_row] = tmp;
        for (size_t row = 0; row < m; row++) {
            if (row == pivot_row || !A[row][col])
                continue;
            // The pivot row is zero in every column before col, so adding it
            // from col onwards is enough.
            for (size_t j = col; j < n; j++) {
                if (A[pivot_row][j])
                    A[row].flip(j);
            }
        }
        pivot_row++;
    }
 }
 // Returns a polynomial of degree k over Z2 (bit i = coefficient of x^i, bit k
 // always set), derived from a randomly drawn element gamma of GF(2^k)\GF(2).
 // Supports 1 <= k <= 31; throws std::logic_error otherwise.
 // NOTE(review): if gamma lies in a proper subfield of GF(2^k) (only possible
 // for composite k), its powers are linearly dependent and the result is
 // presumably not irreducible - confirm whether callers only use prime k.
 uint32_t get_random_irreducible_polynomial_in_Z2 (size_t k) {
    // k == 0 would read irreducible_polynomials[-1]
    if (k == 0)
        throw std::logic_error("We only support polynomials of degree 1 or more.");
    if (k > 31)
        throw std::logic_error("We only support polynomials of degree 31 or less.");
    const uint32_t init_p = irreducible_polynomials[k-1];
    // GF(2)\GF(2) is empty, so there is no gamma to draw for k == 1
    if (k == 1)
        return init_p;
    // Seed only once: reseeding with time(0) on every call makes two calls
    // within the same second return the same polynomial.
    static const bool seeded = (srand(time(0)), true);
    (void)seeded;
    // gamma in GF(2^k)\GF(2): a value in [2, 2^k - 1], i.e. of degree below k.
    // The previous shift by k+1 was undefined for k == 31 and allowed values of
    // degree k, which reduce modulo init_p and may land in GF(2).
    const uint32_t gamma = (rand() % (((uint32_t)1 << k) - 2)) + 2;
    std::vector<uint32_t> gamma_pow(k+1);
    for (size_t i = 0; i <= k; i++)
        gamma_pow[i] = polynomial_power_in_Z2(gamma, i, init_p);
    // Create an array of the polynomials in gamma_pow, and transpose it at the same time:
    // column k-j of row i holds coefficient i of gamma^j
    std::vector<std::bitset<32>> A(k); // NOTE: That 32 > 31 >= k
    for (size_t i = 0; i < k; i++) {
        for (size_t j = 0; j <= k; j++) {
            A[i][k-j] = gamma_pow[j] & ((uint32_t)1<<i);
        }
    }
    rref_Z2(A, k, k+1);
    // The last column of the reduced matrix gives the low k coefficients
    std::bitset<32> bp;
    for (size_t i = 0; i < k; i++) {
        bp[i] = A[i][k];
    }
    bp[k] = 1;
    uint32_t p = (uint32_t)bp.to_ulong();
    return p;
 }
--- a/V1/general_library.hpp
+++ b/V1/general_library.hpp
@ -0,0 +1,14 @@
 #ifndef GENERAL_LIBRARY_H
 #define GENERAL_LIBRARY_H
 #include <stdlib.h>
 #include <stdint.h>
 #include <stdexcept>
 #include <vector>
 #include <bitset>
 #include <iostream>
 // SECTION: Functions related to calculating with polynomials in Z2[x]
 // Returns a randomly generated polynomial of degree k over Z2, intended to be
 // irreducible. Bit i of the result is the coefficient of x^i; bit k is set.
 // Throws std::logic_error if k > 31.
 uint32_t get_random_irreducible_polynomial_in_Z2 (size_t k);
 #endif
--- a/V1/generate_initial_irreducible_polynomials.sage
+++ b/V1/generate_initial_irreducible_polynomials.sage
@ -0,0 +1,12 @@
 # Prints one irreducible polynomial over GF(2) per degree 1..max_k as a C++
 # binary literal, ready to paste into the table in general_library.cpp.
 F = GF(2)
 PR = PolynomialRing(F, 'x')
 max_k = 31
 for i in range(1, max_k+1):
    # Coefficients are listed lowest degree first, so reverse them to get the
    # most significant bit first
    poly_int = '0b'+ ''.join(map(str, PR.irreducible_element(i).coefficients(sparse=False)[::-1]))
    poly_int += ','
    # Pad so that the trailing comments line up
    poly_int += ' '*(max_k-i)
    print(f'    {poly_int}// irreducible polynomial of degree {i}')
--- a/V1/generate_random_irreducible_polynomial.sage
+++ b/V1/generate_random_irreducible_polynomial.sage
@ -0,0 +1,96 @@
 # Reference computation: derive a degree-k polynomial from a random element
 # gamma of GF(2^k) outside GF(2), printing every intermediate step.
 k = 31
 F = GF(2)
 E = GF(2^k)
 PR = PolynomialRing(F, 'x')
 p = PR.irreducible_element(k)
 # Draw until gamma is not an element of GF(2)
 while(True):
    gamma = E.random_element()
    if gamma not in F:
        break
 # gamma = PR('x^3+x')
 # print('0b'+ ''.join(map(str, gamma.coefficients(sparse=False)[::-1])))
 # Powers gamma^0 .. gamma^k, each reduced modulo p
 eqs = [PR(gamma)^i % p for i in range(k+1)]
 for eq in eqs:
    print(eq)
 print()
 # Coefficient lists (lowest degree first), zero-padded to length k
 eqs = list(map(lambda eq: eq.coefficients(sparse=False) + [0]*(k-eq.degree()-1), eqs))
 for eq in eqs:
    print(eq)
 print()
 # One row per power, highest power first
 eqs = matrix(eqs[::-1])
 print(eqs)
 print()
 # After transposing, each column holds one power of gamma
 eqs = eqs.transpose()
 print(eqs)
 print()
 rref = eqs.rref()
 print(rref)
 # The last column of the reduced matrix gives the low coefficients; the
 # leading coefficient 1 is appended
 irrpol = PR(rref[:,-1].list() + [1])
 print(irrpol)
 print(irrpol.is_irreducible())
 print()
 # manual rref
 def calc_rref_Z2(A, m, n):
    """Calculate the reduced row echelon form of a (mxn)-matrix

    Works on a copy of A and returns it; the argument is left unchanged.
    NOTE(review): the back substitution adds row i to clear column i, which
    appears to assume that the pivot of row i is in column i - confirm that
    callers only pass matrices for which that holds.
    """
    A = copy(A)
    # calculate row echelon form
    # https://en.wikipedia.org/wiki/Gaussian_elimination#Pseudocode
    h = 0 # Initialization of the pivot row
    k = 0 # Initialization of the pivot column (local; shadows the global k)
    while h < m and k < n:
        # Find the k-th pivot:
        i_max = -1
        for i in range(h, m):
            if A[i,k] == 1:
                i_max = i
                break
        if i_max == -1:
            # No pivot in this column, pass to next column
            k += 1
        else:
            # Swap the pivot row into position h
            tmp = A[i_max, :]
            A[i_max, :] = A[h, :]
            A[h, :] = tmp
            # Do for all rows below pivot:
            for i in range(h+1, m):
                f = A[i][k];
                if f == 0:
                    continue;
                # Fill with zeros the lower part of pivot column:
                A[i, k] = 0;
                # Do for all remaining elements in current row:
                for j in range(k+1, n):
                    A[i, j] = A[i, j] - A[h, j]
            # Increase pivot row and column
            h += 1
            k += 1
    # perform back substitution
    for i in range(1, m):
        for j in range(i):
            if A[j, i] == 1:
                A[j, :] -= A[i, :]
    return A
 # Repeat the derivation with the hand-written RREF so that its output can be
 # compared with the built-in rref() result printed earlier
 print('Manual RREF:\n')
 rref = calc_rref_Z2(eqs, k, k+1) # cols = rows+1, since we transposed the matrix
 print(rref)
 print()
 irrpol = PR(rref[:,-1].list() + [1])
 print(irrpol)
 print(irrpol.is_irreducible())
 print()
 # Print the polynomial as a binary literal, most significant bit first
 print('0b'+ ''.join(map(str, irrpol.coefficients(sparse=False)[::-1])))
--- a/V1/multiply_polynomials_modulo_polynomial.sage
+++ b/V1/multiply_polynomials_modulo_polynomial.sage
@ -0,0 +1,68 @@
 import math
 # Test setup: a random polynomial gamma and the reference value of
 # gamma^exp mod p computed with Sage's built-in arithmetic
 k = 31
 F = GF(2)
 var = 'x'
 PR = PolynomialRing(F, var)
 p = PR.irreducible_element(k)
 gamma = PR.random_element(k)
 exp = 10
 target = gamma^exp % p
 # Computes q^exp modulo p by multiplying by q one step at a time
 # (exp - 1 multiplications). Returns the plain integer 1 for exp == 0.
 def polynomial_power_in_Z2(q, exp, p, var):
    if exp == 0:
        return 1
    # A q of the same degree as p is reduced by adding p once
    if q.degree() == p.degree():
        q += p
    res = q
    for i in range(2, exp+1):
        res = multiply_polynomials_in_Z2(res, q, p, var)
    return res
 # Computes q^exp modulo p by repeated squaring. Uses the global ring PR.
 # Returns the plain integer 1 for exp == 0.
 def polynomial_power_in_Z2_V2(q, exp, p, var):
    if exp == 0:
        return 1
    # A q of the same degree as p is reduced by adding p once
    if q.degree() == p.degree():
        q += p
    # Number of binary digits of exp
    log2deg = math.floor(math.log2(exp)) + 1
    # arr[i] holds q^(2^i) modulo p
    arr = [0]*log2deg
    arr[0] = q
    for i in range(1, log2deg):
        arr[i] = multiply_polynomials_in_Z2(arr[i-1], arr[i-1], p, var)
    res = PR(1)
    # bin(exp)[:1:-1] yields the binary digits of exp, least significant first
    for i, b in enumerate(bin(exp)[:1:-1]):
        if b == '1':
            res = multiply_polynomials_in_Z2(res, arr[i], p, var)
    return res
 # Multiplies q1 by q2 modulo p. Uses the global ring PR.
 # q1 may be of at most the same degree as p; raises ValueError otherwise.
 def multiply_polynomials_in_Z2(q1, q2, p, var):
    if q1.degree() > p.degree():
        raise ValueError('Unsupported!')
    if q1.degree() == p.degree():
        q1 += p
    # arr[i] holds q1 * var^i, reduced by adding p whenever the degree reaches
    # that of p
    arr = [0]*(q2.degree()+1)
    arr[0] = q1
    for i in range(1, q2.degree()+1):
        arr[i] = arr[i-1]*PR(var)
        if arr[i].degree() == p.degree():
            arr[i] += p
    # Add up the shifted copies selected by the non-zero terms of q2
    return sum(arr[i] for i in q2.exponents())
 # Print the reference value followed by the results of both implementations
 # so that they can be compared by eye
 print(target)
 res = polynomial_power_in_Z2(gamma, exp, p, var)
 print(res)
 res = polynomial_power_in_Z2_V2(gamma, exp, p, var)
 print(res)
--- a/V1/simple_string_matching
+++ b/V1/simple_string_matching
--- a/V1/simple_string_matching.cpp
+++ b/V1/simple_string_matching.cpp
@ -0,0 +1,65 @@
 /* #define NDEBUG */
 #include "Rabin_fingerprint.hpp"
 #include "general_library.hpp"
 #include <iostream>
 #include <stdint.h>
 #include <math.h>
 #include <string>
 #include <fstream>
 // Prints a match message containing the start index and the `length`
 // characters of T beginning at `index`.
 void print_match (size_t index, size_t length, std::string &T) {
    std::cout << "Match found at index " << index << " with the text \"";
    const size_t end = index + length;
    for (size_t pos = index; pos < end; ++pos)
        std::cout << T[pos];
    std::cout << "\"" << std::endl;
 }
 // Searches a text file for a fixed pattern by comparing Rabin fingerprints of
 // the pattern and of a sliding window over the text. Matches are reported on
 // fingerprint equality alone.
 // Returns EXIT_FAILURE if the text file cannot be opened.
 int main() {
    /* const char *path = "../books/the_complete_works_of_william_shakespeare.txt"; */
    const char *path = "../books/genji_monogatari_english.txt";
    std::ifstream ifs(path);
    // Previously an unopened file silently produced an empty text
    if (!ifs) {
        std::cerr << "Could not open " << path << std::endl;
        return EXIT_FAILURE;
    }
    std::string T( (std::istreambuf_iterator<char>(ifs) ),
                    (std::istreambuf_iterator<char>() ) );
    /* std::string T = "Hello, this is my test string averylongword is a necessary word to exceed the 32 bit window."; */
    // Test without the modulo polynomial - and two matches
    std::string P = "word";
    // Test with the modulo polynomial
    /* std::string P = "averylongword"; */
    std::cout << "Searching for pattern:" << std::endl;
    std::cout << "    " << P << std::endl;
    /* std::cout << "in text:" << std::endl; */
    /* std::cout << "    " << T << std::endl; */
    std::cout << std::endl;
    /* uint32_t polynomial = pow(2, 30) + pow(2, 2) + 1; // x^31 + x^3 + 1 */
    uint32_t polynomial = get_random_irreducible_polynomial_in_Z2(31);
    /* uint32_t polynomial = 0b11010011100100000111101011110111; */
    size_t window_size_in_bits = P.length()*8;
    // Hash the pattern
    Rabin_fingerprint fP(polynomial, window_size_in_bits);
    for (char c : P)
        fP.push_char(c);
    // A text shorter than the pattern cannot match; this also avoids reading
    // past the end of T while filling the first window.
    if (T.length() >= P.length()) {
        // Hash the first window of the text
        Rabin_fingerprint fT(polynomial, window_size_in_bits);
        for (size_t i = 0; i < P.length(); i++)
            fT.push_char(T[i]);
        if (fT.get_fingerprint() == fP.get_fingerprint())
            print_match(0, P.length(), T);
        // Slide the window one character at a time
        for (size_t i = P.length(); i < T.length(); i++) {
            fT.slide_char(T[i], T[i-P.length()]);
            if (fT.get_fingerprint() == fP.get_fingerprint())
                print_match(i-P.length()+1, P.length(), T);
        }
    }
    std::cout << std::endl;
    std::cout << "Done!" << std::endl;
    return EXIT_SUCCESS;
 }
--- a/V1/test_rabin_fingerprint.sage
+++ b/V1/test_rabin_fingerprint.sage
@ -0,0 +1,97 @@
 from random import randint
 F = GF(2)
 PR = PolynomialRing(F, 'x')
 k = 31
 # P is the modulo polynomial; m is the number of random coefficients tested
 P = PR.irreducible_element(k)
 m = 100
 # Test the calculation for moving the left edge of the sliding window
 for _ in range(1):
    q = tuple(randint(0, 1) for _ in range(m))
    for i in range(1, m+1):
        # NOTE(review): j is not used in the assertion, so the same check is
        # repeated for every j - confirm whether j was meant to appear in it
        for j in range(i+1, m+1):
            assert (PR(q[:i]) % P) == (PR(q) % P) - (PR(f'x^{i}')*PR(q[i:]) % P)
 # Moving the right side of the window is as described in the Rabin Fingerprint article
 # Next step (TODO)
 # pattern     = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1,1,1,1,0,0,1,0,0,0,1)
 # period      = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1,1,1,1,0,0,1,0,0,0)
 # m           = len(pattern)
 # s_period    = tuple(list(period)+[0]*(m-len(period)))
 # pattern_1   = (1)
 # period_1    = (1)
 # s_period_1  = tuple(list(period_1)+[0]*(m-len(period_1)))
 # pattern_2   = (1,0)
 # period_2    = (1,0)
 # s_period_2  = tuple(list(period_2)+[0]*(m-len(period_2)))
 # pattern_4   = (1,0,1,1)
 # period_4    = (1,0,1)
 # s_period_4  = tuple(list(period_4)+[0]*(m-len(period_4)))
 # pattern_8   = (1,0,1,1,1,1,0,1)
 # period_8    = (1,0,1,1,1)
 # s_period_8  = tuple(list(period_8)+[0]*(m-len(period_8)))
 # pattern_16  = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1)
 # period_16   = (1,0,1,1,1,1,0,1,1,0,1,0)
 # s_period_16 = tuple(list(period_16)+[0]*(m-len(period_16)))
 # for i in range(len(pattern)-len(pattern_4)-len(period_4)):
 #     assert PR(pattern[i+len(period_4):i+len(pattern_4)+len(period_4)]) == PR(pattern[i:i+len(pattern_4)] + pattern[i+len(pattern_4):i+len(pattern_4)+len(period_4)]) - PR(s_period_4)
    # assert PR(pattern[i+len(period_4):i+len(pattern_4)+len(period_4)]) == pattern[i-len(period_4):i+len(pattern_4)-len(period_4)]+pattern[i+len(pattern_4)-len(period_4):i+len(pattern_4)-len(period_4)] - PR(s_period_4)
 # Do the bits of a prime number correspond to the coefficients of an irreducible polynomial?
 # Counts, over a slice of 10000 primes, how many give an irreducible polynomial
 # of degree k when their binary digits are read as coefficients.
 k = 31
 reducible = 0
 irreducible = 0
 for p in Primes()[200000000:200010000]:#[100000:100000]:
 # for p in range(2147483648,2147483648+10000):
    # Binary digits of p, least significant first, used as coefficients
    poly = PR(tuple(bin(p)[2:][::-1]))
    # print(f'{poly.degree()}')
    # Stop at the first polynomial above degree k; skip those below it
    if poly.degree() > k:
        break
    if poly.degree() != k:
        continue
    irr = poly.is_irreducible()
    # print(f'The polynomial {poly}, corresponding to the prime {p}, being an irreducible polynomial is {irr}.')
    if irr:
        irreducible += 1
    else:
        reducible += 1
 # NOTE(review): this divides by zero if no polynomial of degree k was seen
 print(f'{irreducible}/{reducible+irreducible} of the primes correspond to irreducible polynomials. That is {float(irreducible/(reducible+irreducible))*100}%')
 # For primes whose bit pattern is an irreducible polynomial, compare integer
 # reduction (i % p) with polynomial reduction (i_poly % p_poly) on a random
 # i in [p+1, 2p-1], and count how often the two agree.
 progress = 0
 the_same = 0
 different = 0
 for p in Primes()[200000000:200010000]:
    progress += 1
    print(f'\r{progress}/10000', end='')
    p_poly = PR(tuple(bin(p)[2:][::-1]))
    # Only primes that correspond to an irreducible polynomial are tested
    if not p_poly.is_irreducible():
        continue
    # i = p + randint(1,2**29)
    i = p + randint(1,p-1)
    # print(f'{i}, {p}, {2*p}, {i%p}')
    i_poly = PR(tuple(bin(i)[2:][::-1]))
    i_mod_p = i % p
    i_mod_p_poly = PR(tuple(bin(i_mod_p)[2:][::-1]))
    # print(f'i_poly: {i_poly}')
    # print(f'p_poly: {p_poly}')
    # print(f'i_mod_p_poly: {i_mod_p_poly}')
    if i_mod_p_poly == i_poly % p_poly:
        the_same += 1
    else:
        different += 1
    # if not i_mod_p_poly == i_poly - (p_poly - PR(f'x^{p_poly.degree()}')):
    # if not i_mod_p_poly == i_poly % p_poly:
    #     print()
    #     print('ERROR')
    #     print(i_mod_p_poly)
    #     # print(i_poly - (p_poly - PR(f'x^{p_poly.degree()}')))
    #     print(i_poly % p_poly)
    #     break
    # assert i_mod_p_poly == i_poly - (p_poly - PR(f'x^{p_poly.degree()}'))
 print()
 # NOTE(review): this divides by zero if no prime passed the irreducibility filter
 print(f'{the_same}/{the_same+different} are the same as if we did polynomial calculations. This is {float(the_same/(the_same+different))*100}%')
--- a/books/genji_monogatari_english.txt
+++ b/books/genji_monogatari_english.txt
--- a/books/the_complete_works_of_william_shakespeare.txt
+++ b/books/the_complete_works_of_william_shakespeare.txt
--- a/compare_fingerprint_false_positive_probabilities.sage
+++ b/compare_fingerprint_false_positive_probabilities.sage
@ -0,0 +1,73 @@
 # Rabin fingerprint: k > lg(n*m/e), where e is the upper bound on the error probability
 # Karp-Rabin fingerprint: error probability <= pi(n(n-m+1))/pi(M)
 # (pi is presumably the prime-counting function; it is computed by fpi below)
 # Parameters for 32-bit fingerprints
 M = 2**32-1  # argument of pi(M), the denominator of the Karp-Rabin bound
 k = 31  # exponent in the Rabin bound n*m/(2**k)
 # Parameters for 16-bit fingerprints (disabled)
 # M = 2**16-1
 # k = 13
 def fpi(a):
    """Return the zero-based rank i of the prime Primes().next(a).

    The rank is located with an adaptive-step search over Primes().unrank(i):
    the step `jump` is doubled while the search keeps moving in one direction
    and halved otherwise. The current step is printed as a progress indicator.

    NOTE(review): if Primes().next(a) is the first prime strictly above a, the
    returned rank equals the number of primes <= a, i.e. pi(a) -- confirm.
    NOTE(review): `jump` is halved with integer division and could reach 0;
    termination is not obvious from the code -- verify for the inputs used.
    """
    p = Primes()
    a_next = p.next(a)  # the prime whose rank we are looking for
    i = 0  # rank currently being probed
    jump = 1  # current step size
    # Saturating direction counter in [-2, 2]: downward steps push it towards 2,
    # upward steps towards -2. Starting at -2 makes the first upward steps double.
    lastdirection = -2
    while(True):
        # progress output; '\r' keeps overwriting the same terminal line
        print(f'{jump:010d}', end='\r')
        # print(f'{i}, {jump}')
        val = p.unrank(i)
        if val == a_next:
            return i # the count of smaller primes; ranks start at 0, so i itself is that count
        elif val > a_next:
            # overshot: step downwards
            if lastdirection == 2:
                # counter saturated on "down": double the step
                # (the decrement cancels the increment below, keeping the counter at 2)
                # print('mul')
                lastdirection -= 1
                jump *= 2
            else:
                # direction changed recently: halve the step
                # print('div')
                jump //= 2
            lastdirection += 1
            # print(jump)
            i -= jump
        else:
            # undershot: step upwards (mirror image of the branch above)
            if lastdirection == -2:
                # counter saturated on "up": double the step
                # print('mul')
                lastdirection += 1
                jump *= 2
            else:
                # print('div')
                jump //= 2
            lastdirection -= 1
            i += jump
 # Rabin fingerprint
 # k = lg(n*m/e) <=>
 # 2^k = n*m/e <=>
 # 2^k/(n*m) = 1/e <=>
 # n*m/(2^k) = e
 # Karp-Rabin fingerprint
 # e = pi(n(n-m+1))/pi(M)
 # print(pi(2**32-1))
 # e_rabin = n*m/(2^k)
 # The denominator of the Karp-Rabin bound is the same for every (n, m); compute it once.
 piM = fpi(M)
 m_values = [10**e for e in range(8)]     # 1, 10, ..., 10^7
 n_values = [10**e for e in range(1, 9)]  # 10, 100, ..., 10^8
 for m in m_values:
    for n in n_values:
        # only pairs with m < n are compared
        if m < n:
            print(f'(n, m) = ({n}, {m})')
            # Rabin bound: e = n*m/(2^k)
            e_rabin = n*m/(2**k)
            print(f'Rabin: {float(e_rabin):.2e}')
            # Karp-Rabin bound: e = pi(n(n-m+1))/pi(M)
            e_karpr = fpi(n*(n-m+1))/piM
            print(f'KarpR: {float(e_karpr):.2e}')
            print()
            print(f'{e_karpr} >= 1 is {e_karpr >= 1} | {e_rabin} >= 1 is {e_rabin >= 1}')
            # once either bound reaches 1, stop trying larger n for this m
            if float(e_karpr) >= 1 or float(e_rabin) >= 1:
                break
--- a/ex53.cpp
+++ b/ex53.cpp
@ -0,0 +1,175 @@
 /* #define NDEBUG */
 #include "hash_table.hpp"
 #include "hashing_algorithms.hpp"
 #include <stdlib.h>
 #include <stdio.h>
 #include <string.h>
 #include <chrono>
 #include <iostream>
 #include <bitset>
 #include <fstream>
 #include <ctype.h>
 #include <vector>
 #include <assert.h>
 using namespace std;
 const int max_string_length = 256;
 const int D = (max_string_length+7) >> 3; // D = ceil(max_string_length/size(char))
 My_string * read_word(const char * book, size_t * reading_progress);
 int main() {
    const clock_t clock_before_seed = clock();
    // load seed generated by random.org
    string filename = "random_org_16_bit_numbers.txt";
    std::ifstream seed_file(filename);
    uint16_t seed_part;
    uint16_t seed_parts[D << 2];
    size_t count = 0;
    while (seed_file >> seed_part) {
        seed_parts[count] = seed_part;
        count++;
        if (count == D << 2)
            break; // the seed is large enough for the max_string_length
    }
    if (count != D << 2) {
        cout << "The current seed is not large enough. Please extend it by appending the numbers at https://www.random.org/integers/?num=10000&min=0&max=65535&col=1&base=10&format=plain&rnd=new." << endl;
        return EXIT_SUCCESS;
    }
    // Get 64 bit seed from 16 bit seed
    uint64_t seed[D];
    memcpy(seed, seed_parts, D*sizeof(seed[0]));
    const clock_t clock_before_hash_table = clock();
    size_t l = 1; // initially, hash to a table of up to 1024 distinct words (2^10)
    Hash_table ht = Hash_table(new Hash_function(seed, multiply_shift_string, l, D));
    const clock_t clock_before_loading_book = clock();
    // choose a book
    /* std::ifstream ifs("genji_monogatari_english.txt"); */
    /* std::ifstream ifs("Child_of_Light.txt"); */
    /* std::ifstream ifs("the_adventures_of_sherlock_holmes.txt"); */
    /* std::ifstream ifs("dracula.txt"); */
    std::ifstream ifs("the_complete_works_of_william_shakespeare.txt");
    string book_string( (std::istreambuf_iterator<char>(ifs) ),
                    (std::istreambuf_iterator<char>() ) );
    const char * book = book_string.c_str();
    const size_t book_length = book_string.size();
    const clock_t clock_before_reading = clock();
    std::vector<My_string *> words;
    size_t reading_progress = 0;
    while (reading_progress < book_length-1) { // book_length includes '\0' which reading_progress avoids
        My_string * word = read_word(book, &reading_progress);
        if (word->size > 0)
            words.push_back(word);
    }
    const clock_t clock_after_reading = clock();
    size_t count_words = 0;
    for (My_string * word : words) {
        count_words++;
        ht.hash(word);
        if (ht.is_time_for_rehash()) {
            l++; // double the universe which we hashes to
            ht.rehash(new Hash_function(seed, multiply_shift_string, l, D));
        }
    }
    const clock_t clock_after_hashing = clock();
    Hash_function hf = Hash_function(seed, multiply_shift_string, 10, D);
    const clock_t clock_after_init_hash_function = clock();
    uint64_t hashed_value = 0;
    for (My_string * word : words) {
        /* hf.hash(word); */
        hashed_value += hf.hash(word);
    }
    const clock_t clock_after_hashing_only = clock();
    cout << "Sum of the hashed values (after overflow): " << hashed_value << endl;
    cout << "Nr of words: " << count_words << endl;
    cout << "Distinct words: " << ht.get_distict_words() << endl;
    cout << "Time: Load seed:    " << float( clock_before_hash_table - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash table:    " << float( clock_before_loading_book - clock_before_hash_table ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Load book:    " << float( clock_before_reading - clock_before_loading_book ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Read:    " << float( clock_after_reading - clock_before_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash & Table:    " << float( clock_after_hashing - clock_after_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Total:    " << float( clock_after_hashing - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash function:    " << float( clock_after_init_hash_function - clock_after_hashing ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash, no table:    " << float( clock_after_hashing_only - clock_after_init_hash_function ) / CLOCKS_PER_SEC << endl;
    for (My_string * word : words)
        delete word;
    // BONUS: Polynomium hashing
    uint32_t result_un;
    size_t book_as_integer_length = (book_length+3)>>2; // ceil(book_length/4)
    uint32_t book_as_integer[book_as_integer_length];
    book_as_integer[book_as_integer_length-1] = 0;
    memcpy(book_as_integer, book, book_length*sizeof(book[0]));
    uint32_t a[3] = {12313,2212312,123332};
    uint32_t b[3] = {5345,213213,123123};
    uint32_t c[3] = {3231,213144,450022};
    const clock_t begin_time_pol = clock();
    result_un = polynomial_vector(book_as_integer, a, b, c, book_as_integer_length >> 2, 32);
    const clock_t end_time_pol = clock();
    cout << "polynomium hash function time:                     " << float( end_time_pol - begin_time_pol ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result_un << endl;
    const clock_t begin_time_pol_tun = clock();
    result_un = polynomial_vector_tuned(book_as_integer, a, b, c, book_as_integer_length >> 2, 32, seed);
    const clock_t end_time_pol_tun = clock();
    cout << "tuned polynomium hash function time:                     " << float( end_time_pol_tun - begin_time_pol_tun ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result_un << endl;
    return EXIT_SUCCESS;
 }
 // Reads the next word (a maximal run of alphanumeric characters) from `book`.
 //
 // book:             NUL-terminated text.
 // reading_progress: in/out index into `book`. It is advanced BEFORE each
 //                   character is read, so scanning starts at index
 //                   *reading_progress + 1; on return it is the index of the
 //                   last character consumed.
 // Returns a newly allocated My_string (the caller owns it) holding the word in
 // lower case, cropped to max_string_length characters. The result is empty
 // when the end of the text is reached before any alphanumeric character.
 My_string * read_word(const char * book, size_t * reading_progress) {
    char word[max_string_length];
    size_t word_length = 0;
    while (book[*reading_progress+1] != '\0') {
        (*reading_progress)++;
        // the <ctype.h> functions require a value representable as unsigned char
        const unsigned char c = static_cast<unsigned char>(book[*reading_progress]);
        if (isalnum(c)) {
            if (word_length != max_string_length) { // crop words longer than the max_string_length
                // lower-case every character, including the first one, so that
                // "The" and "the" are the same word
                word[word_length] = static_cast<char>(tolower(c));
                word_length++;
            }
        } else if (word_length > 0) {
            // first separator after a started word ends it
            return new My_string(word, word_length);
        }
        // separators in front of a word are skipped
    }
    // end of text: return whatever has been collected (possibly nothing)
    return new My_string(word, word_length);
 }
--- a/fagprojekt_code/Makefile
+++ b/fagprojekt_code/Makefile
@ -0,0 +1,48 @@
 CC = cc # C compiler
 # cc and gcc is the same
 CXX = c++ # C++ compiler
 # c++
 # g++
 # clang++
 CPPFLAGS = # preprocessor flags
 CFLAGS = -Wall -Wfloat-equal -std=c99 -O0 -mtune=native -funroll-loops $(OPT) # C compiler flags
 # -Wall: Warnings all
 # -Wfloat-equal: Warn if comparing floats with ==
 # -OX: Optimization level -O0 (none, default), -O1, -O2, -O3 (most, may increase file size), -Os (decrease file size), -ffast-math
 # -mtune: Tune for specific/generic CPU
 # -funroll-loops: Unroll loops when compiling
 # -fopenmp: Enable OpenMP (When running, set the environmental variable OMP_NUM_THREADS)
 # $(OPT): Passes any parameter given when calling make with 'make OPT=...'
 CXXFLAGS = -Wall -std=c++17 -O0 # C++ compiler flags
 LDFLAGS = # linker flags
 LDLIBS = # library flags
 # -lm (for <math.h>)
 # -lblas (BASIC LINEAR ALGEBRA SUBPROGRAMS)
 # -lcblas (for <cblas.h>)
 # -lopenblas (NOT INSTALLED; blas and cblas in one; conflicts with blas and cblas)
 # -llapack (LAPACK)
 # -llapacke (LAPACKE) NOTE: The order of "-llapacke -llapack -lblas" is very important
 #LINK.o = $(CXX) $(LDFLAGS) # use CXX for linking
 # What to do when making ex1.c
 #ex1: datasize1.o
 # What to do when making ex1.cpp (C++ style)
 #ex1: datasize1.cpp
 ex53: hashed_string.cpp hash_table.cpp hashing_algorithms.cpp
 eq17: hashed_string.cpp hash_table.cpp hashing_algorithms.cpp
 # Tell make that 'clean' is not the name of a file, so the recipe always runs
 # (even if a file called 'clean' exists)
 .PHONY: clean
 # A make target that cleans (by deleting the built binaries and the object files)
 clean:
 	$(RM) fast_modulo eq17 ex53 hashed_string hash_table *.o
 fast_modulo:
--- a/fagprojekt_code/ascii_to_bits.cpp
+++ b/fagprojekt_code/ascii_to_bits.cpp
@ -0,0 +1,57 @@
 #include <stdlib.h>
 /* #include <chrono> */
 #include <iostream>
 /* #include <stdio.h> */
 /* #include <cmath> */
 /* #include <string.h> */
 /* #include <stdint.h> */
 #include <bitset>
 #include <fstream>
 using namespace std;
 int main() {
    string s = "test";
    const char * c = s.c_str();
    for (size_t i = 0; i < s.size(); i++) {
        cout << std::bitset<__CHAR_BIT__>( c[i] ) << " ";
    }
    cout << endl;
    std::ifstream ifs("genji_monogatari_english.txt");
    string genji( (std::istreambuf_iterator<char>(ifs) ),
                       (std::istreambuf_iterator<char>()    ) );
    const char * c2 = genji.c_str();
    for (size_t i = 0; i < 1000; i++) {
        /* cout << std::bitset<__CHAR_BIT__>( c2[i] ) << " "; */
        cout << c2[i];
    }
    cout << endl;
    /* cout << genji.size() << endl; */
    /* unsigned char bitgenji[genji.size()]; */
    /* for (size_t i = 0; i < genji.size(); ++i) */
    /* { */
    /*     bitgenji[i] = static_cast<unsigned char>( bitset<8>(genji[i]).to_ulong() ); */
    /* } */
    /* for (size_t i = 0; i < 4; ++i) */
    /* { */
    /*     cout << (bitset<8>) bitgenji[i] << endl; */
    /*     cout << (unsigned int) bitgenji[i] << endl; */
    /* } */
    /* for (size_t i = 0; i < 100; ++i) */
    /* { */
    /*     cout <<  bitgenji[i]; */
    /* } */
    /* cout << endl; */
    return EXIT_SUCCESS;
 }
--- a/fagprojekt_code/eq17.cpp
+++ b/fagprojekt_code/eq17.cpp
@ -0,0 +1,138 @@
 #include "hashing_algorithms.hpp"
 #include <stdlib.h>
 #include <chrono>
 #include <iostream>
 /* #include <stdio.h> */
 #include <cmath>
 /* #include <string.h> */
 /* #include <stdint.h> */
 using namespace std;
 // Micro-benchmark comparing several ways of computing y*m/M for all y < M
 // (float division, integer division, precomputed ratio; each also manually
 // unrolled by 10), followed by a timing of multiply_shift_strongly_universal.
 // `result` is printed after every loop so the computations stay observable.
 // NOTE: the unrolled loops step by 10 and M is not a multiple of 10, so their
 // last iteration evaluates a few values y >= M.
 int main() {
    unsigned int M = 9299983;
    unsigned int m = 3226097;
    unsigned int result = 0;
    const clock_t begin_time1 = clock();
    for (unsigned int y = 0; y < M; y++) {
        result = (unsigned int) ((float)(y*m)/(float)M);
    }
    const clock_t end_time1 = clock();
    cout << "Naive time:                     " << float( end_time1 - begin_time1 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    const clock_t begin_time2 = clock();
    for (unsigned int y = 0; y < M; y += 10) {
        result = (unsigned int) ((float)(y*m)/(float)M);
        result = (unsigned int) ((float)((y+1)*m)/(float)M);
        result = (unsigned int) ((float)((y+2)*m)/(float)M);
        result = (unsigned int) ((float)((y+3)*m)/(float)M);
        result = (unsigned int) ((float)((y+4)*m)/(float)M);
        result = (unsigned int) ((float)((y+5)*m)/(float)M);
        result = (unsigned int) ((float)((y+6)*m)/(float)M);
        result = (unsigned int) ((float)((y+7)*m)/(float)M);
        result = (unsigned int) ((float)((y+8)*m)/(float)M);
        result = (unsigned int) ((float)((y+9)*m)/(float)M);
    }
    const clock_t end_time2 = clock();
    cout << "Naive time (unrolled):          " << float( end_time2 - begin_time2 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    const clock_t begin_time6 = clock();
    for (unsigned int y = 0; y < M; y++) {
        result = y*m/M;
    }
    const clock_t end_time6 = clock();
    cout << "Naive time (no-typecasting):    " << float( end_time6 - begin_time6 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    const clock_t begin_time7 = clock();
    for (unsigned int y = 0; y < M; y += 10) {
        result = y*m/M;
        result = ((y+1)*m)/M;
        result = ((y+2)*m)/M;
        result = ((y+3)*m)/M;
        result = ((y+4)*m)/M;
        result = ((y+5)*m)/M;
        result = ((y+6)*m)/M;
        result = ((y+7)*m)/M;
        result = ((y+8)*m)/M;
        result = ((y+9)*m)/M;
    }
    const clock_t end_time7 = clock();
    cout << "Naive time (no-typecasting, unrolled):    " << float( end_time7 - begin_time7 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    // Precompute the ratio m/M once so each iteration is a single multiplication.
    float mM = (float) m/(float) M;
    const clock_t begin_time3 = clock();
    for (unsigned int y = 0; y < M; y ++) {
        result = (unsigned int) (((float) y)*mM);
    }
    const clock_t end_time3 = clock();
    cout << "Precalculation time:            " << float( end_time3 - begin_time3 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    const clock_t begin_time4 = clock();
    for (unsigned int y = 0; y < M; y += 10) {
        result = (unsigned int) ((float) y*mM);
        result = (unsigned int) ((float) (y+1)*mM);
        result = (unsigned int) ((float) (y+2)*mM);
        result = (unsigned int) ((float) (y+3)*mM);
        result = (unsigned int) ((float) (y+4)*mM);
        result = (unsigned int) ((float) (y+5)*mM);
        result = (unsigned int) ((float) (y+6)*mM);
        result = (unsigned int) ((float) (y+7)*mM);
        result = (unsigned int) ((float) (y+8)*mM);
        result = (unsigned int) ((float) (y+9)*mM);
    }
    const clock_t end_time4 = clock();
    cout << "Precalculation time (unrolled): " << float( end_time4 - begin_time4 ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result << endl;
    /* for (unsigned int y = 0; y < M; y++){ */
    /*     // Very often, differentiating by multiplying first or dividing first results in the result being off by 1 from each other */
    /*     /1* if (abs((int) ((float)y*((float)m/(float)M)) - (int) ((float) y*mM)) >= 1) *1/ */
    /*     /1*     cout <<(unsigned int) ((float)y*(float)m/(float)M) << " != " << (unsigned int) ((float) y*mM) << endl; *1/ */
    /*     /1* if (abs((int)(y*m/M - (y*m)/M)) >= 1) *1/ */
    /*     /1*     cout <<y*m/M << " != " << (y*m)/M << endl; *1/ */
    /*     /1* if (abs((int)(((float)y*((float)m/(float)M)) - (y*m)/M)) >= 1) *1/ */
    /*     /1*     cout <<(unsigned int)((float)y*((float)m/(float)M)) << " != " << (y*m)/M << endl; *1/ */
    /*     if (abs((int)(((float)y*(float)m)/(float)M - (unsigned int)y*(unsigned int)m/(unsigned int)M)) >= 1) */
    /*         cout <<((float)(y*m)/(float)M << " != " << (unsigned int)y*(unsigned int)m/(unsigned int)M << endl; */
    /* } */
    // The non-precalculation model is susceptible to overflow
    /* for (unsigned int y = 0; y < 40; y++) { */
    /*     cout << "y: " << y << ", "; */
    /*     cout << "m: " << m << ", "; */
    /*     cout << "M: " << M << ", "; */
    /*     cout << "mM: " << mM << ", "; */
    /*     cout << "y*m: " << y*m << ", "; */
    /*     cout << "(y*m)/M: " << (y*m)/M << ", "; */
    /*     cout << "y*(m/M): " << y*(m/M) << ", "; */
    /*     cout << y*m/M; */
    /*     cout << " != "; */
    /*     cout << (unsigned int) ((float)(y*m)/(float)M); */
    /*     cout << " != "; */
    /*     cout << (unsigned int) ((float)y*(float)m/(float)M); */
    /*     cout << " != "; */
    /*     cout << (unsigned int) ((float) y*mM); */
    /*     cout << endl; */
    /* } */
    uint64_t result_un = 0;
    // Build the constants with integer shifts: pow() works in double, whose
    // 53-bit mantissa cannot represent 2^61-1, so pow(2, 61)-1 rounds to 2^61.
    const uint64_t p = (static_cast<uint64_t>(1) << 61) - 1;    // 2^61 - 1
    const uint64_t m_un = (static_cast<uint64_t>(1) << 20) + 2; // 2^20 + 2
    const clock_t begin_time_un = clock();
    for (uint64_t y = 0; y < 100000000; y++) {
        /* result_un = multiply_mod_prime_mersenne_overflow(y, m, M, p, m_un); */
        result_un = multiply_shift_strongly_universal(y, p, m_un, 20);
    }
    const clock_t end_time_un = clock();
    cout << "Unrelated hash function time:                     " << float( end_time_un - begin_time_un ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result_un << endl;
    return EXIT_SUCCESS;
 }
--- a/fagprojekt_code/ex53.cpp
+++ b/fagprojekt_code/ex53.cpp
@ -0,0 +1,175 @@
 /* #define NDEBUG */
 #include "hash_table.hpp"
 #include "hashing_algorithms.hpp"
 #include <stdlib.h>
 #include <stdio.h>
 #include <string.h>
 #include <chrono>
 #include <iostream>
 #include <bitset>
 #include <fstream>
 #include <ctype.h>
 #include <vector>
 #include <assert.h>
 using namespace std;
 const int max_string_length = 256;
 const int D = (max_string_length+7) >> 3; // D = ceil(max_string_length/size(char))
 My_string * read_word(const char * book, size_t * reading_progress);
 int main() {
    const clock_t clock_before_seed = clock();
    // load seed generated by random.org
    string filename = "random_org_16_bit_numbers.txt";
    std::ifstream seed_file(filename);
    uint16_t seed_part;
    uint16_t seed_parts[D << 2];
    size_t count = 0;
    while (seed_file >> seed_part) {
        seed_parts[count] = seed_part;
        count++;
        if (count == D << 2)
            break; // the seed is large enough for the max_string_length
    }
    if (count != D << 2) {
        cout << "The current seed is not large enough. Please extend it by appending the numbers at https://www.random.org/integers/?num=10000&min=0&max=65535&col=1&base=10&format=plain&rnd=new." << endl;
        return EXIT_SUCCESS;
    }
    // Get 64 bit seed from 16 bit seed
    uint64_t seed[D];
    memcpy(seed, seed_parts, D*sizeof(seed[0]));
    const clock_t clock_before_hash_table = clock();
    size_t l = 1; // initially, hash to a table of up to 1024 distinct words (2^10)
    Hash_table ht = Hash_table(new Hash_function(seed, multiply_shift_string, l, D));
    const clock_t clock_before_loading_book = clock();
    // choose a book
    /* std::ifstream ifs("genji_monogatari_english.txt"); */
    /* std::ifstream ifs("Child_of_Light.txt"); */
    /* std::ifstream ifs("the_adventures_of_sherlock_holmes.txt"); */
    /* std::ifstream ifs("dracula.txt"); */
    std::ifstream ifs("the_complete_works_of_william_shakespeare.txt");
    string book_string( (std::istreambuf_iterator<char>(ifs) ),
                    (std::istreambuf_iterator<char>() ) );
    const char * book = book_string.c_str();
    const size_t book_length = book_string.size();
    const clock_t clock_before_reading = clock();
    std::vector<My_string *> words;
    size_t reading_progress = 0;
    while (reading_progress < book_length-1) { // book_length includes '\0' which reading_progress avoids
        My_string * word = read_word(book, &reading_progress);
        if (word->size > 0)
            words.push_back(word);
    }
    const clock_t clock_after_reading = clock();
    size_t count_words = 0;
    for (My_string * word : words) {
        count_words++;
        ht.hash(word);
        if (ht.is_time_for_rehash()) {
            l++; // double the universe which we hashes to
            ht.rehash(new Hash_function(seed, multiply_shift_string, l, D));
        }
    }
    const clock_t clock_after_hashing = clock();
    Hash_function hf = Hash_function(seed, multiply_shift_string, 10, D);
    const clock_t clock_after_init_hash_function = clock();
    uint64_t hashed_value = 0;
    for (My_string * word : words) {
        /* hf.hash(word); */
        hashed_value += hf.hash(word);
    }
    const clock_t clock_after_hashing_only = clock();
    cout << "Sum of the hashed values (after overflow): " << hashed_value << endl;
    cout << "Nr of words: " << count_words << endl;
    cout << "Distinct words: " << ht.get_distict_words() << endl;
    cout << "Time: Load seed:    " << float( clock_before_hash_table - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash table:    " << float( clock_before_loading_book - clock_before_hash_table ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Load book:    " << float( clock_before_reading - clock_before_loading_book ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Read:    " << float( clock_after_reading - clock_before_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash & Table:    " << float( clock_after_hashing - clock_after_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Total:    " << float( clock_after_hashing - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash function:    " << float( clock_after_init_hash_function - clock_after_hashing ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash, no table:    " << float( clock_after_hashing_only - clock_after_init_hash_function ) / CLOCKS_PER_SEC << endl;
    for (My_string * word : words)
        delete word;
    // BONUS: Polynomium hashing
    uint32_t result_un;
    size_t book_as_integer_length = (book_length+3)>>2; // ceil(book_length/4)
    uint32_t book_as_integer[book_as_integer_length];
    book_as_integer[book_as_integer_length-1] = 0;
    memcpy(book_as_integer, book, book_length*sizeof(book[0]));
    uint32_t a[3] = {12313,2212312,123332};
    uint32_t b[3] = {5345,213213,123123};
    uint32_t c[3] = {3231,213144,450022};
    const clock_t begin_time_pol = clock();
    result_un = polynomial_vector(book_as_integer, a, b, c, book_as_integer_length >> 2, 32);
    const clock_t end_time_pol = clock();
    cout << "polynomium hash function time:                     " << float( end_time_pol - begin_time_pol ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result_un << endl;
    const clock_t begin_time_pol_tun = clock();
    result_un = polynomial_vector_tuned(book_as_integer, a, b, c, book_as_integer_length >> 2, 32, seed);
    const clock_t end_time_pol_tun = clock();
    cout << "tuned polynomium hash function time:                     " << float( end_time_pol_tun - begin_time_pol_tun ) / CLOCKS_PER_SEC << endl;
    cout << "Result: " << result_un << endl;
    return EXIT_SUCCESS;
 }
 // Reads the next word (a maximal run of alphanumeric characters) from `book`.
 //
 // book:             NUL-terminated text.
 // reading_progress: in/out index into `book`. It is advanced BEFORE each
 //                   character is read, so scanning starts at index
 //                   *reading_progress + 1; on return it is the index of the
 //                   last character consumed.
 // Returns a newly allocated My_string (the caller owns it) holding the word in
 // lower case, cropped to max_string_length characters. The result is empty
 // when the end of the text is reached before any alphanumeric character.
 My_string * read_word(const char * book, size_t * reading_progress) {
    char word[max_string_length];
    size_t word_length = 0;
    while (book[*reading_progress+1] != '\0') {
        (*reading_progress)++;
        // the <ctype.h> functions require a value representable as unsigned char
        const unsigned char c = static_cast<unsigned char>(book[*reading_progress]);
        if (isalnum(c)) {
            if (word_length != max_string_length) { // crop words longer than the max_string_length
                // lower-case every character, including the first one, so that
                // "The" and "the" are the same word
                word[word_length] = static_cast<char>(tolower(c));
                word_length++;
            }
        } else if (word_length > 0) {
            // first separator after a started word ends it
            return new My_string(word, word_length);
        }
        // separators in front of a word are skipped
    }
    // end of text: return whatever has been collected (possibly nothing)
    return new My_string(word, word_length);
 }
--- a/fagprojekt_code/fast_modulo.cpp
+++ b/fagprojekt_code/fast_modulo.cpp
@ -0,0 +1,202 @@
 #include <stdlib.h>
 #include <stdio.h>
 #include <math.h>
 #include <string.h>
 #include <stdint.h>
 void printIntInBinary(unsigned int n);
 void intToBinary(unsigned int n, char* p);
 void strrev(char* p, unsigned int len);
 unsigned int mod32BitMersenne(unsigned int x, unsigned int m);
 // Scratch program exploring fast modulo with Mersenne-style moduli
 // (p = 2^q - 1) and a few bit-manipulation experiments; everything is printed
 // in decimal and binary.
 int main() {
    unsigned int q = 2;
    // Integer shifts instead of pow(): exact and no floating-point round trip.
    unsigned int x = (1u << (2*q)) - 1; // 2^(2q) is the max value for x
    unsigned int p = (1u << q) - 1;
    unsigned int y;
    // x mod p for p = 2^q - 1: add the low q bits to the remaining high bits,
    // then subtract p once if needed
    y=(x&p)+(x>>q);
    if (y>=p) y-=p;
    // all values are unsigned, so they are printed with %u
    printf("q = %u, x = %u, p = %u, y = %u\n", q, x, p, y);
    printf("x&p = %u, x>>q = %u\n", x&p, x>>q);
    printIntInBinary(x);
    printIntInBinary(p);
    printIntInBinary(x&p);
    printIntInBinary(x>>q);
    printf("\n");
    // Keep only the lowest 6, 5, 4, 3 and 2 bits by shifting up and back down.
    printIntInBinary( ((unsigned int)0b1111101111011101101<<26)>>26 );
    printIntInBinary( ((unsigned int)0b1111101111011101101<<27)>>27 );
    printIntInBinary( ((unsigned int)0B1111101111011101101<<28)>>28 );
    printIntInBinary( ((unsigned int)0B1111101111011101101<<29)>>29 );
    printIntInBinary( ((unsigned int)0B1111101111011101101<<30)>>30 );
    unsigned int a = 0b0110000000;
    unsigned int b = 0b1111111001;
    printf("\n");
    printIntInBinary(a);
    printIntInBinary(b);
    // copy bits 7..8 of a into bits 1..2 of b
    b = (b & ~0b110) | ((a & 0b110000000) >> 6);
    printIntInBinary(a);
    printIntInBinary(b);
    /* // Too general an approach */
    /* // TODO: Special case where ax+b < p < m */
    /* // ((ax+b) mod p) mod m, p=2^89-1, m=2^20 */
    /* size_t r = 89; // aka q */
    /* size_t bits = 32; */
    /* size_t remainingBits = r; */
    /* size_t lastIndex = 0; */
    /* size_t len = 4; */
    /* uint32_t data[len], tmp[len]; */
    /* // mod p, p = 2^89-1 */
    /* // x&p */
    /* for (size_t i = 0; (i+1)*bits < r; i++ ) { */
    /*     tmp[i] = data[i]&0b1111'1111'1111'1111'1111'1111'1111'1111; // 32 ones. Standard since C++14 */
    /*     remainingBits -= 32; */
    /*     lastIndex = i+1; */
    /* } */
    /* size_t shiftLen = bits-remainingBits; // TODO: Check for 1-off errors */
    /* tmp[lastIndex] = (data[lastIndex]<<shiftLen)>>shiftLen; // mod 2^remainingBits */
    /* // x>>q */
    /* /1* for (size_t i = 0; i < len; i++) { *1/ */
    /* /1* } *1/ */
    /* // mod m, m = 2^20 */
    /* unsigned int mMinusOne = 0b1111'1111'1111'1111'1111; // 20 ones. Standard since C++14 */
    /* data[len-1] = data[len-1]&mMinusOne; */
    /* // Can be optimized further */
    /* size_t len = 4; // input parameter */
    /* uint32_t data[len], tmp[len]; */
    /* //// mod p, p = 2^89-1 */
    /* // x&p */
    /* tmp[len] = data[len]&0b1111'1111'1111'1111'1111'1111'1111'1111; // 32 ones. */
    /* tmp[len] = data[len]&0b1111'1111'1111'1111'1111'1111'1111'1111; // 32 ones. */
    /* tmp[len] = data[len]&0b1'1111'1111'1111'1111'1111'1111; // remaining bits = 89-32*2 = 25 ones. */
    /* // x>>q */
    /* //// mod m, m = 2^20 */
    /* unsigned int mMinusOne = 0b1111'1111'1111'1111'1111; // 20 ones. */
    /* data[len-1] = data[len-1]&mMinusOne; */
    /* // Optimize more! */
    /* size_t len = 4; // input parameter */
    /* uint32_t data[len]; // input parameter */
    /* uint32_t tmp; */
    /* //// mod p, p = 2^89-1 */
    /* // x&p */
    /* tmp = data[len-1]&0b1111'1111'1111'1111'1111; // 20 ones */
    /* // x>>q */
    /* // 89 - 2*32 = 25 so */
    /* tmp = tmp + (data[len]>>5)&0b1111'1111'1111'1111'1111; // 20 ones */
    /* //// mod m, m = 2^20 */
    /* tmp = tmp&0b1111'1111'1111'1111'1111; // 20 ones = m - 1 */
    /* // clean up before output */
    /* for (size_t i = 0; i < len; i++) */
    /*     data[i] = 0; */
    /* // output */
    /* data[len-1] = tmp; */
    /* // More!!! */
    /* size_t len = 4; // input parameter */
    /* uint32_t data[len]; // input parameter */
    /* //// mod p, p = 2^89-1 */
    /* // x&p */
    /* data[len-1] = data[len-1]&0b1111'1111'1111'1111'1111; // 20 ones */
    /* // x>>q */
    /* // 89 - 2*32 = 25 so */
    /* data[len-1] = data[len-1] + ((data[len-3]>>5)&0b1111'1111'1111'1111'1111); // 20 ones */
    /* //// mod m, m = 2^20 */
    /* data[len-1] = data[len-1]&0b1111'1111'1111'1111'1111; // 20 ones = m - 1 */
    /* // data[len-1] is the result */
    // Final, fully condensed form of the steps sketched above. `len` is a
    // compile-time constant so `data` is a regular array, and it is
    // zero-initialized so the expression below never reads indeterminate values.
    const size_t len = 4; // input parameter
    uint32_t data[len] = {}; // input parameter
    data[len-1] = (data[len-1] + (data[len-3]>>5))&0b1111'1111'1111'1111'1111; // 20 ones
    // data[len-1] is the result
    // Or as a function
    // void mod89mod20 (uint32_t * data, size_t len) {
    //     data[len-1] = (data[len-1] + (data[len-3]>>5))&0b1111'1111'1111'1111'1111; // 20 ones
    // }
    return EXIT_SUCCESS;
 }
 // Reduces x by repeated subtraction: p is subtracted for as long as x >= p,
 // and the remaining value is returned.
 template <typename T>
 T mod (T x, T p) {
    for (; x >= p; x -= p) {
        // all the work happens in the loop header
    }
    return x;
 }
 // Prints n in decimal followed by its binary representation, one value per line.
 void printIntInBinary(unsigned int n) {
    char binary_digits[100]; // filled by intToBinary
    intToBinary(n, binary_digits);
    printf("%5u = %10s\n", n, binary_digits);
 }
 // Writes the binary representation of n (most significant digit first, no
 // leading zeros, "0" for n == 0) into p as a NUL-terminated string.
 // Does nothing when p is NULL.
 void intToBinary(unsigned int n, char* p) {
    if (p == NULL)
        return;
    char* const first_digit = p;
    int digit_count = 0;
    // emit the digits least significant first ...
    do {
        *p++ = (n % 2 == 0) ? '0' : '1';
        n >>= 1;
        ++digit_count;
    } while (n > 0);
    *p = '\0';
    // ... then reverse them into reading order
    strrev(first_digit, digit_count);
 }
 // Reverses the first len characters of p in place.
 void strrev(char* p, unsigned int len) {
    int back = len - 1;
    // swap the outermost pair and move both indices towards the middle
    for (int front = 0; front < back; ++front, --back) {
        const char held = p[front];
        p[front] = p[back];
        p[back] = held;
    }
 }
--- a/fagprojekt_code/hash_table.cpp
+++ b/fagprojekt_code/hash_table.cpp
@ -0,0 +1,56 @@
 #include "hash_table.hpp"
 #include "hashed_string.hpp"
 #include <stdint.h>
 #include <string.h>
 // Takes the given hash function (it is deleted in the destructor) and
 // allocates one default-constructed Hashed_string per table slot.
 Hash_table::Hash_table(Hash_function * hash_function) : hash_function(hash_function) {
    const size_t slot_count = this->hash_function->get_m();
    this->m = slot_count;
    this->words = new Hashed_string[slot_count];
 }
 // Frees the hash function and the slot array.
 Hash_table::~Hash_table() {
    delete this->hash_function;
    delete[] this->words;
 }
 size_t Hash_table::get_distict_words() {
    return distinct_words;
 }
 // Hashes `word` to a slot and appends a new Hashed_string built from it to
 // that slot; the value returned by append() is added to distinct_words.
 void Hash_table::hash(My_string * word) {
    const uint64_t slot = hash_function->hash(word);
    Hashed_string * entry = new Hashed_string(word);
    distinct_words += words[slot].append(entry);
 }
 // Hashes the string held by `hs` to a slot and appends `hs` itself to that
 // slot; the value returned by append() is added to distinct_words.
 void Hash_table::hash(Hashed_string * hs) {
    const My_string * key = &(hs->string);
    const uint64_t slot = hash_function->hash(key);
    distinct_words += words[slot].append(hs);
 }
 // Replaces the hash function (the previous one is deleted), allocates a slot
 // array of the new size and re-inserts a copy of every chained entry of the
 // old array before freeing it.
 void Hash_table::rehash(Hash_function * hash_function) {
    delete this->hash_function;
    this->hash_function = hash_function;
    const size_t previous_m = m;
    Hashed_string * previous_words = words;
    m = this->hash_function->get_m();
    words = new Hashed_string[m];
    // every word is hashed once more, so the counter starts over
    distinct_words = 0;
    for (size_t slot = 0; slot < previous_m; slot++) {
        // the slot's own Hashed_string is only the initializer; the entries
        // are the nodes chained behind it
        for (Hashed_string * node = previous_words[slot].next; node != NULL; node = node->next) {
            hash(new Hashed_string(node));
        }
    }
    // delete the old stuff
    delete[] previous_words;
 }
--- a/fagprojekt_code/hash_table.hpp
+++ b/fagprojekt_code/hash_table.hpp
@ -0,0 +1,56 @@
 #ifndef HASH_TABLE_H
 #define HASH_TABLE_H
 #include "hashed_string.hpp"
 #include <stdint.h>
 // Bundles a string-hash routine with the seed, output width and scratch buffer
 // it is called with.
 //
 // Ownership: `x` is allocated in the constructor and released in the
 // destructor; `seed` is only stored, never freed here.
 // NOTE(review): no copy constructor/assignment is declared, so copying an
 // instance would free `x` twice - pass instances by pointer or reference.
 struct Hash_function {
    private:
        uint64_t * seed; // caller-provided seed words (not owned)
        uint64_t(* hash_function)(const My_string *, const uint64_t *, uint64_t *, size_t);
        size_t l; // the table size is 2^l
        uint64_t * x; // scratch buffer of D words handed to hash_function (owned)
    public:
        // D: number of 64 bit words to allocate for the scratch buffer.
        Hash_function(uint64_t * seed, uint64_t(* hash_function)(const My_string *, const uint64_t *, uint64_t *, size_t), size_t l, size_t D)
            : seed(seed), hash_function(hash_function), l(l), x(new uint64_t[D]) {
        }
        ~Hash_function() {
            delete[] x;
        }
        // Returns 2^l. The shift is done in size_t: the former `1 << l` shifted
        // an int and overflowed for l >= 31. l must be below the bit width of size_t.
        size_t get_m() {
            return (size_t)1 << l;
        }
        // Forwards to the wrapped routine with the stored seed, scratch buffer and l.
        uint64_t hash(const My_string * string) {
            return hash_function(string, seed, x, l);
        }
 };
 // Chained hash table that counts distinct words.
 // The definitions in hash_table.cpp allocate `words` as an array of `m`
 // Hashed_string bucket heads and delete both `words` and `hash_function` in
 // the destructor.
 struct Hash_table {
    private:
        Hash_function * hash_function; // deleted by the destructor and by rehash()
        Hashed_string * words; // array of m bucket heads
        size_t distinct_words = 0; // sum of the values returned by Hashed_string::append
        size_t m; // number of buckets, taken from hash_function->get_m()
    public:
        Hash_table(Hash_function * hash_function);
        ~Hash_table();
        // (sic) the misspelled name is part of the public interface
        size_t get_distict_words();
        // Hashes a copy of `word` into the table.
        void hash(My_string * word);
        // Hashes the given node into the table; the node itself is appended to a chain.
        void hash(Hashed_string * hs);
        // Swaps in a new hash function and re-inserts all stored words.
        void rehash(Hash_function * hash_function);
        // Nonzero once there are at least as many distinct words as buckets.
        int is_time_for_rehash() {return distinct_words >= m;}
 };
 #endif
--- a/fagprojekt_code/hashed_string.cpp
+++ b/fagprojekt_code/hashed_string.cpp
@ -0,0 +1,78 @@
 #include "hashed_string.hpp"
 #include <stdlib.h>
 #include <stdint.h>
 #include <string>
 #include <string.h>
 #include <iostream>
 // Take a private copy of `size` characters starting at `chars`.
 // `chars` is not read when `size` is 0, so it may be NULL in that case.
 My_string::My_string(char * chars, size_t size) {
    char * const copy = new char[size];
    if (size > 0)
        memcpy(copy, chars, size*sizeof(copy[0]));
    this->chars = copy;
    this->size = size;
 }
 // Free the character buffer allocated by the constructor.
 My_string::~My_string() {
    delete[] this->chars;
 }
 // Two strings are equal when they have the same length and the same bytes.
 // The buffers are length-counted rather than NUL-terminated, so the bytes are
 // compared with memcmp: strncmp would stop at the first zero byte and report
 // buffers that differ after it as equal.
 bool My_string::operator==(const My_string& other)
 {
    if (size != other.size)
        return false;
    return memcmp(chars, other.chars, size) == 0;
 }
 // Default construction yields the "initializer": a chain head with an empty
 // string that does not itself represent a hashed word.
 Hashed_string::Hashed_string() : initializer(true), string(NULL, 0) {
 }
 // Node holding a copy of `s`, with the default appearance count.
 Hashed_string::Hashed_string(My_string * s) : string(s->chars, s->size) {
 }
 // Node holding a copy of the string and appearance count of `hs`; the links
 // of `hs` are not copied.
 Hashed_string::Hashed_string(Hashed_string * hs) : string(hs->string.chars, hs->string.size), appearances(hs->appearances) {
 }
 // Destroying the initializer (chain head) destroys the whole chain; destroying
 // any other node only releases that node.
 Hashed_string::~Hashed_string() {
    if (!initializer)
        return;
    // remove() unlinks and deletes the node it is called on, so `next` advances
    // until the chain is empty
    while (next != NULL)
        next->remove(next);
 }
 // Walk the chain starting at this node. If a non-initializer node holds an
 // equal string, add the appearance count of `new_string` to it and return 0
 // (`new_string` is not linked). Otherwise link `new_string` behind the last
 // element and return 1.
 int Hashed_string::append(Hashed_string * new_string) {
    Hashed_string * node = this;
    for (;;) {
        const bool holds_word = !node->initializer;
        if (holds_word && node->string == new_string->string) {
            node->appearances += new_string->appearances;
            return 0;
        }
        if (node->last_element) {
            new_string->previous = node;
            node->next = new_string;
            node->last_element = false;
            return 1;
        }
        node = node->next;
    }
 }
 // Unlink and delete the first node at or after this one whose string equals
 // the string of `removed_string`. Does nothing if no such node exists.
 // The initializer (chain head) is never a candidate: it holds an empty
 // placeholder string and has no `previous`, so matching it - possible before
 // when removing an empty string - dereferenced a NULL pointer.
 void Hashed_string::remove(Hashed_string * removed_string) {
    if (initializer && last_element)
        return; // empty chain
    if (!initializer && string == removed_string->string) {
        if (last_element) {
            previous->last_element = true;
            previous->next = NULL;
        } else {
            previous->next = next;
            next->previous = previous;
        }
        delete this;
        return; // no member may be touched after this point
    }
    if (!last_element)
        next->remove(removed_string);
 }
--- a/fagprojekt_code/hashed_string.hpp
+++ b/fagprojekt_code/hashed_string.hpp
@ -0,0 +1,34 @@
 #ifndef HASHED_OBJECT_H
 #define HASHED_OBJECT_H
 #include <string>
 // Length-counted character buffer.
 // The constructor in hashed_string.cpp copies `size` characters into a
 // new[]-allocated buffer and the destructor delete[]s it.
 // NOTE(review): no copy constructor/assignment is declared, so a copy would
 // share `chars` and free it twice.
 struct My_string {
    char * chars; // buffer of `size` characters; no terminator is stored
    size_t size; // number of characters in `chars`
    My_string(char *, size_t);
    ~My_string();
    // true when both strings have the same size and contents
    bool operator==(const My_string& other);
 };
 // Node of a doubly linked chain of hashed words. A default-constructed node
 // is the "initializer": the head of a chain that holds no word itself.
 struct Hashed_string {
    Hashed_string * next = NULL;
    Hashed_string * previous = NULL;
    bool last_element = true; // true while no node is linked behind this one
    bool initializer = false; // marks the object as the link between its owner and the linked list of hashed elements. Such an instance DOES NOT represent a hashed value.
    My_string string; // the word stored in this node (empty for the initializer)
    unsigned int appearances = 1; // how many times the word has been seen
    Hashed_string(); // creates an initializer
    Hashed_string(My_string * s); // copies s
    Hashed_string(Hashed_string * hs); // copies the string and appearances of hs
    ~Hashed_string();
    int append(Hashed_string * new_string); // returns 1 if the word was new and 0 otherwise.
    void remove(Hashed_string * removed_string); // unlinks and deletes the node whose string equals removed_string's
 };
 #endif
--- a/fagprojekt_code/hashing_algorithms.cpp
+++ b/fagprojekt_code/hashing_algorithms.cpp
@ -0,0 +1,294 @@
 #include "hashing_algorithms.hpp"
 #include "hashed_string.hpp"
 #include <string.h>
 // Multiply-mod-prime hashing: ((a*x + b) mod p) mod m.
 // p is prime. p > m > 1, p > a > 0, p > b >= 0
 // a*x + b is evaluated in 64 bit unsigned arithmetic and wraps on overflow.
 uint64_t multiply_mod_prime(uint64_t x, uint64_t a, uint64_t b, uint64_t p, uint64_t m) {
    const uint64_t linear = a*x + b;
    const uint64_t residue = linear % p;
    return residue % m;
 }
 // Reduce y modulo the Mersenne number p = 2^s - 1.
 // Uses 2^s = 1 (mod p): the bits above position s are folded onto the low s
 // bits until nothing is left above. s is the bit length of p - the previous
 // code shifted by p itself, which is an out-of-range shift for any real prime.
 static uint64_t reduce_mod_mersenne(uint64_t y, uint64_t p) {
    unsigned s = 0;
    for (uint64_t bits = p; bits != 0; bits >>= 1)
        s++;
    if (s == 0)
        return y; // p == 0 violates the precondition; nothing sensible to reduce by
    if (s < 64) {
        while ((y >> s) != 0)
            y = (y & p) + (y >> s);
    }
    // now 0 <= y <= p, and p itself is congruent to 0
    return (y == p) ? 0 : y;
 }
 // Keep the q least significant bits of y (y mod 2^q) without ever shifting a
 // 64 bit value by 64 or more.
 static uint64_t keep_low_bits(uint64_t y, char q) {
    if (q <= 0)
        return 0;
    if (q >= 64)
        return y;
    return y & ~( ( ~(uint64_t)0 ) << q);
 }
 // p is a Mersenne prime. p > m > 1, p > a > 0, p > b >= 0
 // Returns ((a*x + b) mod p) mod m; a*x + b is evaluated in 64 bit arithmetic,
 // so it must not exceed 2^64 - 1 for the result to be exact.
 uint64_t multiply_mod_prime_mersenne(uint64_t x, uint64_t a, uint64_t b, uint64_t p, uint64_t m) {
    return reduce_mod_mersenne(a*x+b, p) % m;
 }
 // p is a Mersenne prime. m=2^q. p > m > 1, p > a > 0, p > b >= 0
 // Returns ((a*x + b) mod p) mod 2^q.
 uint64_t multiply_mod_prime_mersenne_overflow(uint64_t x, uint64_t a, uint64_t b, uint64_t p, char q) {
    return keep_low_bits(reduce_mod_mersenne(a*x+b, p), q);
 }
 // p is a Mersenne prime. m=2^q. p > m > 1, p > a > 0
 // Returns ((a*x) mod p) mod 2^q.
 uint64_t multiply_mod_prime_mersenne_overflow_no_b(uint64_t x, uint64_t a, uint64_t p, char q) {
    return keep_low_bits(reduce_mod_mersenne(a*x, p), q);
 }
 // Computes (a*x + b) mod p for p = 2^89-1 and returns the l most significant
 // bits of the lowest 32 bit word of the result.
 // 32 >= l > 0. p > a > 0, p > b >= 0.
 // All multi-word values store the MOST significant 32 bit word first:
 //   x is a 64 bit integer given as 2 words, a and b are 89 bit integers given as 3 words.
 uint32_t multiply_mod_prime_mersenne_overflow_high_bitcount(uint32_t * x, uint32_t * a, uint32_t * b, char l) {
    const uint32_t low25 = 0x1FFFFFF;     // 25 ones: the part of p inside word 2
    const uint32_t all32 = 0xFFFFFFFF;    // 32 ones
    // ax: the 2*3 partial products x[i]*a[ii], each split into its low word
    // (even index) and high word (odd index)
    uint32_t ax[12]; // 12 = 2*3*2
    for (size_t i = 0; i < 2; i++) { // index x
        for (size_t ii = 0; ii < 3; ii++) { // index a
            const uint64_t tmp = (uint64_t)x[i] * (uint64_t)a[ii];
            ax[6*i+2*ii] = (uint32_t)tmp;
            ax[6*i+2*ii+1] = (uint32_t)(tmp >> 32);
        }
    }
    // y = a*x + b, five words, most significant first. Kept on the stack: the
    // previous heap allocation was never released.
    uint32_t y[5];
    uint64_t sum = 0;
    uint32_t carry = 0;
    // bits 0-31
    sum = (uint64_t)ax[10] + (uint64_t)b[2];
    carry = (uint32_t)(sum >> 32);
    y[4] = (uint32_t)sum;
    // bits 32-63
    sum = (uint64_t)carry + (uint64_t)ax[11] + (uint64_t)ax[8] + (uint64_t)ax[4] + (uint64_t)b[1];
    carry = (uint32_t)(sum >> 32);
    y[3] = (uint32_t)sum;
    // bits 64-95
    sum = (uint64_t)carry + (uint64_t)ax[9] + (uint64_t)ax[5] + (uint64_t)ax[2] + (uint64_t)ax[6] + (uint64_t)b[0];
    carry = (uint32_t)(sum >> 32);
    y[2] = (uint32_t)sum;
    // bits 96-127
    sum = (uint64_t)carry + (uint64_t)ax[3] + (uint64_t)ax[7] + (uint64_t)ax[0];
    carry = (uint32_t)(sum >> 32);
    y[1] = (uint32_t)sum;
    // bits 128-159: the carry of the previous word belongs here as well
    y[0] = ax[1] + carry;
    //// calculate modulo p for p=2^89-1, using 2^89 = 1 (mod p)
    // y & p: the 89 least significant bits
    uint32_t yandp[3];
    yandp[2] = y[4];
    yandp[1] = y[3];
    yandp[0] = y[2] & low25;
    // y >> 89: the remaining 5*32 - 89 = 71 most significant bits
    uint32_t yshift[3];
    yshift[2] = (y[2] >> 25) // keep 7 bits
                | (y[1] << 7); // keep 25 bits
    yshift[1] = (y[1] >> 25) | (y[0] << 7);
    yshift[0] = y[0] >> 25;
    // y = (y & p) + (y >> 89)
    sum = (uint64_t)yandp[2] + (uint64_t)yshift[2];
    carry = (uint32_t)(sum >> 32);
    y[4] = (uint32_t)sum;
    sum = (uint64_t)carry + (uint64_t)yandp[1] + (uint64_t)yshift[1];
    carry = (uint32_t)(sum >> 32);
    y[3] = (uint32_t)sum;
    y[2] = (uint32_t)((uint64_t)carry + (uint64_t)yandp[0] + (uint64_t)yshift[0]);
    //// if y >= p; y -= p
    if ((y[2] >> 25) != 0) {
        // bit 89 is set. Subtracting 2^89-1 equals subtracting 2^89 and adding 1.
        y[2] = y[2] & low25;
        for (size_t i = 4; i > 1; i--) {
            y[i] += 1;
            if (y[i] != 0)
                break; // no further carry
        }
    } else if (y[2] == low25 && y[3] == all32 && y[4] == all32) {
        // y == p, which is congruent to 0; only the lowest word is used below
        y[4] = 0;
    }
    // keep the l top bits of the lowest word
    return (y[4] >> (32-l));
 }
 // Multiply-shift hashing: the l most significant bits of a*x, where the
 // product wraps modulo 2^64. l must satisfy 0 < l <= 64.
 uint64_t multiply_shift_c_universal(uint32_t x, uint64_t a, char l) {
    const uint64_t product = a*x;
    const int dropped_bits = 64-l;
    return product >> dropped_bits;
 }
 // Multiply-shift hashing with an additive term: the l most significant bits
 // of a*x + b, where the sum wraps modulo 2^64. l must satisfy 0 < l <= 64.
 uint64_t multiply_shift_strongly_universal(uint32_t x, uint64_t a, uint64_t b, char l) {
    const uint64_t linear = a*x + b;
    const int dropped_bits = 64-l;
    return linear >> dropped_bits;
 }
 // Multiply-shift hashing of a vector of d 32 bit words: the l most
 // significant bits of sum(seed[i]*x[i]) + seed[d-1], evaluated modulo 2^64.
 // Reads seed[0 .. d-1]; d must be at least 1 and 0 < l <= 64.
 uint64_t multiply_shift_vector(uint32_t * x, uint64_t * seed, size_t d, char l) {
    uint64_t acc = 0;
    for (size_t i = 0; i != d; ++i) {
        const uint64_t term = seed[i]*x[i];
        acc += term;
    }
    acc += seed[d-1];
    return acc >> (64-l);
 }
 // Pair-multiply-shift hashing of a byte string.
 // The string is copied into the scratch buffer x as d = ceil(size/8) 64 bit
 // words (the last word zero padded), so x must hold at least d words.
 // Reads seed[2*i] and seed[2*i+1] for every i < d, plus seed[d] as the
 // additive term, so seed must hold at least max(2*d, d+1) words.
 // Returns the l most significant bits of the 64 bit sum; 0 < l <= 64.
 uint64_t multiply_shift_string(const My_string * string, const uint64_t * seed, uint64_t * x, size_t l) {
    const size_t d = (string->size+7) >> 3; // d = ceil(string->size/8)
    if (d != 0) {
        // clear the last word first so the bytes behind the string are zero
        x[d-1] = 0;
        memcpy(x, string->chars, string->size*sizeof(string->chars[0]));
    }
    // d == 0 (empty string): nothing is copied. The unconditional x[d-1] = 0
    // used to write far outside the buffer in that case.
    uint64_t val = 0;
    for (size_t i = 0; i < d; i++)
        val += (seed[2*i]+(uint32_t)(x[i]>>32))*(seed[2*i+1]+(uint32_t)x[i]);
    return (val + seed[d]) >> (64-l);
 }
 // calculate (ax+b) mod p
 // p=2^89-1 is a Mersenne prime. p > a. p > x. a and x are size 3 arrays of uint32_t.
 // b is a 64 bit integer given as a size 2 array of uint32_t.
 // All arrays store the LEAST significant 32 bit word first.
 // The result (in the range 0 .. p-1) is saved in x.
 void high_bitcount_ax_b_mod_p(uint32_t * x, uint32_t * a, uint32_t * b) {
    const uint32_t low25 = 0x1FFFFFF;  // 25 ones: bits 64..88, the part of p inside word 2
    const uint32_t all32 = 0xFFFFFFFF; // 32 ones

    // y = a*x + b as six words, by schoolbook multiplication. b is preloaded so
    // it is accumulated together with the first row; every partial sum
    // x[i]*a[ii] + y[i+ii] + carry fits in 64 bits.
    uint32_t y[6] = {b[0], b[1], 0, 0, 0, 0};
    for (size_t i = 0; i < 3; i++) { // index x
        uint64_t carry = 0;
        for (size_t ii = 0; ii < 3; ii++) { // index a
            const uint64_t t = (uint64_t)x[i] * (uint64_t)a[ii] + (uint64_t)y[i+ii] + carry;
            y[i+ii] = (uint32_t)t;
            carry = t >> 32;
        }
        y[i+3] = (uint32_t)carry; // this word has not been touched by earlier rows
    }

    //// calculate modulo p for p=2^89-1, using 2^89 = 1 (mod p)
    // first fold: s = (y & p) + (y >> 89)
    uint32_t s[4];
    uint64_t t = (uint64_t)y[0] + (uint64_t)((y[2] >> 25) | (y[3] << 7));
    s[0] = (uint32_t)t;
    t = (t >> 32) + (uint64_t)y[1] + (uint64_t)((y[3] >> 25) | (y[4] << 7));
    s[1] = (uint32_t)t;
    t = (t >> 32) + (uint64_t)(y[2] & low25) + (uint64_t)((y[4] >> 25) | (y[5] << 7));
    s[2] = (uint32_t)t;
    s[3] = (uint32_t)(t >> 32) + (y[5] >> 25);

    // second fold: whatever is left above bit 88 is below 2^15
    t = (uint64_t)s[0] + (uint64_t)((s[2] >> 25) | (s[3] << 7));
    s[0] = (uint32_t)t;
    t = (t >> 32) + (uint64_t)s[1];
    s[1] = (uint32_t)t;
    s[2] = (s[2] & low25) + (uint32_t)(t >> 32);

    //// if s >= p; s -= p
    if ((s[2] >> 25) != 0) {
        // bit 89 is set. Subtracting 2^89-1 equals subtracting 2^89 and adding 1.
        s[2] = s[2] & low25;
        for (size_t i = 0; i < 3; i++) {
            s[i] += 1;
            if (s[i] != 0)
                break; // no further carry
        }
    }
    if (s[0] == all32 && s[1] == all32 && s[2] == low25) {
        // s == p, which is congruent to 0
        s[0] = 0;
        s[1] = 0;
        s[2] = 0;
    }
    x[0] = s[0];
    x[1] = s[1];
    x[2] = s[2];
 }
 // Polynomial hashing of a vector modulo the Mersenne prime p=2^89-1:
 // H starts as the first 64 bit element, is updated as H = c*H + x_i for every
 // further element, and is finally mapped through H = a*H + b.
 // p > a >= 0. p > b >= 0. p > c >= 0. x is a size 2d list of 64 bit integers split into 32 bit integers.
 // We assume a, b, and c are size 3 arrays of 32 bit integers.
 // d must be at least 1. Returns the l most significant bits of the lowest
 // 32 bit word of H; 32 >= l > 0.
 // NOTE(review): high_bitcount_ax_b_mod_p documents its additive argument as a
 // 64 bit value, so only the first two words of b take part in the final step - confirm.
 uint32_t polynomial_vector(uint32_t * x, uint32_t * a, uint32_t * b, uint32_t * c, size_t d, char l) {
    uint32_t H[3];
    H[0] = x[0];
    H[1] = x[1];
    H[2] = 0; // the first element is only 64 bits wide; this word used to be read uninitialised
    for (size_t i = 1; i < d; i++) {
        high_bitcount_ax_b_mod_p(H, c, x+2*i);
    }
    high_bitcount_ax_b_mod_p(H, a, b);
    return H[0] >> (32-l);
 }
 // Variant of polynomial_vector that first hashes chunks of x down to 32 bit
 // values with multiply_shift_string and then feeds those values to polynomial_vector.
 // p=2^89-1 is a Mersenne prime.
 // p > a >= 0. p > b >= 0. p > c >= 0. x is a size 2d list of 64 bit integers split into 32 bit integers.
 // We assume a, b, and c are size 3 arrays of 32 bit integers.
 // we assume the seed to be of size 4 (at minimum).
 // NOTE(review): several details below look inconsistent with each other and
 // should be confirmed before this function is relied upon:
 //  - the chunk loop is bounded by (d >> 4) - 1 while the sizes use d >> 2; the
 //    bound is computed in size_t, so it wraps around for d < 16.
 //  - each chunk copies 256 bytes starting at x + i*4, i.e. consecutive chunks
 //    start only 16 bytes apart (x is a uint32_t pointer).
 //  - multiply_shift_string copies the whole string into its scratch buffer,
 //    but buffer_memory holds 4 words (32 bytes) while the strings are 256 bytes.
 //  - entries of x_tuned that neither the loop nor the remainder branch writes
 //    are passed on uninitialised.
 uint32_t polynomial_vector_tuned(uint32_t * x, uint32_t * a, uint32_t * b, uint32_t * c, size_t d, char l, const uint64_t * seed) {
    size_t x_remainder = d - ((d >> 2) << 2); // d mod 4, computed with shifts
    size_t x_tuned_size = (d >> 2) + 1;
    uint32_t x_tuned[x_tuned_size]; // variable length array: a compiler extension in C++
    // prehash chunks of x using the bounded string algorithm
    uint64_t buffer_memory[4]; // scratch buffer handed to multiply_shift_string
    char word[256];
    for (size_t i = 0; i <= (d >> 4) - 1; i++ ) { // d 64 bit integers -> d/4 256 char strings
        memcpy(word, x + i*4, 256*sizeof(word[0]));
        My_string str = My_string(word, 256);
        x_tuned[i] = (uint32_t) multiply_shift_string(&str, seed, buffer_memory, 32);
    }
    // prehash the leftovers
    if (x_remainder != 0) {
        // x_remainder << 3 bytes, i.e. 8 bytes per leftover 64 bit integer
        memcpy(word, x + d-x_remainder, (x_remainder << 3)*sizeof(word[0]));
        My_string str = My_string(word, (x_remainder << 3));
        x_tuned[x_tuned_size-1] = (uint32_t) multiply_shift_string(&str, seed, buffer_memory, 32);
    }
    return polynomial_vector(x_tuned, a, b, c, x_tuned_size, l);
 }
--- a/fagprojekt_code/hashing_algorithms.hpp
+++ b/fagprojekt_code/hashing_algorithms.hpp
@ -0,0 +1,42 @@
 #ifndef HASHING_ALGORITHMS_H
 #define HASHING_ALGORITHMS_H
 #include "hashed_string.hpp"
 #include <stdint.h>
 // Returns ((a*x+b) mod p) mod m, evaluated in 64 bit unsigned arithmetic.
 // p is prime. p > m > 1, p > a > 0, p > b >= 0
 uint64_t multiply_mod_prime(uint64_t x, uint64_t a, uint64_t b, uint64_t p, uint64_t m);
 // Same hash as multiply_mod_prime, with the reduction modulo p done by shifts and masks.
 // p is a Mersenne prime. p > m > 1, p > a > 0, p > b >= 0
 uint64_t multiply_mod_prime_mersenne(uint64_t x, uint64_t a, uint64_t b, uint64_t p, uint64_t m);
 // As above, with the final reduction modulo m replaced by keeping the q low bits.
 // p is a Mersenne prime. m=2^q. p > m > 1, p > a > 0, p > b >= 0
 uint64_t multiply_mod_prime_mersenne_overflow(uint64_t x, uint64_t a, uint64_t b, uint64_t p, char q);
 // As above, without the additive term b.
 // p is a Mersenne prime. m=2^q. p > m > 1, p > a > 0
 uint64_t multiply_mod_prime_mersenne_overflow_no_b(uint64_t x, uint64_t a, uint64_t p, char q);
 // p=2^89-1 is a Mersenne prime. m=2^l. 32 >= l > 0. p > a > 0, p > b >= 0. x is a 64 bit integer. We assume x, a, and b are arrays of 32 bit integers.
 // (x has 2 words, a and b have 3 words each.)
 uint32_t multiply_mod_prime_mersenne_overflow_high_bitcount(uint32_t * x, uint32_t * a, uint32_t * b, char l);
 // Returns (a*x) >> (64-l).
 uint64_t multiply_shift_c_universal(uint32_t x, uint64_t a, char l);
 // Returns (a*x+b) >> (64-l).
 uint64_t multiply_shift_strongly_universal(uint32_t x, uint64_t a, uint64_t b, char l);
 // Hashes the d words of x with the seed words seed[0 .. d-1] and keeps the top l bits.
 uint64_t multiply_shift_vector(uint32_t * x, uint64_t * seed, size_t d, char l);
 // requires x to be of size D and the seed to be of size D
 // NOTE(review): the definition reads seed[2*i+1] for every i < ceil(size/8), so
 // a seed of only D words looks too small for strings longer than 4*D bytes - confirm.
 uint64_t multiply_shift_string(const My_string * string, const uint64_t * seed, uint64_t * x, size_t l);
 // p=2^89-1 is a Mersenne prime.
 // p > a >= 0. p > b >= 0. p > c >= 0. x is a size 2d list of 64 bit integers split into 32 bit integers.
 // We assume a, b, and c are size 3 arrays of 32 bit integers.
 uint32_t polynomial_vector(uint32_t * x, uint32_t * a, uint32_t * b, uint32_t * c, size_t d, char l);
 // p=2^89-1 is a Mersenne prime.
 // p > a >= 0. p > b >= 0. p > c >= 0. x is a size 2d list of 64 bit integers split into 32 bit integers.
 // We assume a, b, and c are size 3 arrays of 32 bit integers.
 // we assume the seed to be of size 4 (at minimum).
 uint32_t polynomial_vector_tuned(uint32_t * x, uint32_t * a, uint32_t * b, uint32_t * c, size_t d, char l, const uint64_t * seed);
 #endif
--- a/fagprojekt_code/hashing_speed_comparisons.cpp
+++ b/fagprojekt_code/hashing_speed_comparisons.cpp
@ -0,0 +1,152 @@
 /* #define NDEBUG */
 #include "hash_table.hpp"
 #include <stdlib.h>
 #include <stdio.h>
 #include <string.h>
 #include <chrono>
 #include <iostream>
 #include <bitset>
 #include <fstream>
 #include <ctype.h>
 #include <vector>
 #include <assert.h>
 using namespace std;
 // Longest word (in chars) that read_word keeps; longer words are cropped.
 const int max_string_length = 256;
 // Number of 8-byte (64 bit) words needed to hold max_string_length chars.
 const int D = (max_string_length+7) >> 3; // D = ceil(max_string_length/8)
 My_string * read_word(const char * book, size_t * reading_progress);
 // Entry point. No speed test is invoked from here at the moment.
 int main() {
    return EXIT_SUCCESS;
 }
 // Time a string-hash routine on the words of a book, both while filling a
 // growing hash table and when only computing the hash values, and print the
 // measurements to stdout.
 //   title:     label printed before the measurements
 //   algorithm: the hash routine under test
 //   seed_file: file with whitespace separated 16 bit numbers; when empty, the
 //              file "random_org_16_bit_numbers.txt" is used
 // Fixes compared to the previous revision, which did not compile: the local
 // stream no longer redeclares the parameter `seed_file`, the early exit no
 // longer returns a value from a void function, and the routine under test is
 // the `algorithm` parameter instead of an undeclared name.
 void speedtest_using_hash_table(string title, uint64_t(* algorithm)(const My_string *, const uint64_t *, uint64_t *, size_t), string seed_file) {
    cout << title << endl;
    const clock_t clock_before_seed = clock();
    // load seed generated by random.org
    const string seed_filename = seed_file.empty() ? string("random_org_16_bit_numbers.txt") : seed_file;
    std::ifstream seed_stream(seed_filename);
    const size_t seed_part_count = D << 2; // four 16 bit parts per 64 bit seed word
    uint16_t seed_part;
    uint16_t seed_parts[D << 2];
    size_t count = 0;
    // stop as soon as the seed is large enough for the max_string_length
    while (count != seed_part_count && seed_stream >> seed_part) {
        seed_parts[count] = seed_part;
        count++;
    }
    if (count != seed_part_count) {
        cout << "The current seed is not large enough. Please extend it by appending the numbers at https://www.random.org/integers/?num=10000&min=0&max=65535&col=1&base=10&format=plain&rnd=new." << endl;
        return;
    }
    // Get 64 bit seed from 16 bit seed
    // NOTE(review): multiply_shift_string indexes seed[2*i+1] for i < ceil(size/8),
    // i.e. up to seed[2*D-1] for the longest words, but only D words are provided
    // here - confirm the seed size required by the routine under test.
    uint64_t seed[D];
    memcpy(seed, seed_parts, D*sizeof(seed[0]));
    const clock_t clock_before_hash_table = clock();
    size_t l = 1; // initially, hash to a table of 2 buckets (2^1); it doubles on every rehash
    Hash_table ht = Hash_table(new Hash_function(seed, algorithm, l, D));
    const clock_t clock_before_loading_book = clock();
    // choose a book
    /* std::ifstream ifs("genji_monogatari_english.txt"); */
    /* std::ifstream ifs("Child_of_Light.txt"); */
    /* std::ifstream ifs("the_adventures_of_sherlock_holmes.txt"); */
    /* std::ifstream ifs("dracula.txt"); */
    std::ifstream ifs("the_complete_works_of_william_shakespeare.txt");
    string book_string( (std::istreambuf_iterator<char>(ifs) ),
                    (std::istreambuf_iterator<char>() ) );
    const char * book = book_string.c_str();
    const size_t book_length = book_string.size();
    const clock_t clock_before_reading = clock();
    std::vector<My_string *> words;
    size_t reading_progress = 0;
    // read_word looks one character ahead of reading_progress. Written as an
    // addition so that an empty book (book_length == 0) does not wrap around.
    while (reading_progress + 1 < book_length) {
        My_string * word = read_word(book, &reading_progress);
        if (word->size > 0)
            words.push_back(word);
        else
            delete word; // nothing was read; do not leak the empty word
    }
    const clock_t clock_after_reading = clock();
    size_t count_words = 0;
    for (My_string * word : words) {
        count_words++;
        ht.hash(word);
        if (ht.is_time_for_rehash()) {
            l++; // double the universe which we hash to
            ht.rehash(new Hash_function(seed, algorithm, l, D));
        }
    }
    const clock_t clock_after_hashing = clock();
    Hash_function hf = Hash_function(seed, algorithm, 10, D);
    const clock_t clock_after_init_hash_function = clock();
    // the sum is printed below so that the hashing cannot be optimised away
    uint64_t hashed_value = 0;
    for (My_string * word : words) {
        /* hf.hash(word); */
        hashed_value += hf.hash(word);
    }
    const clock_t clock_after_hashing_only = clock();
    cout << "Sum of the hashed values (after overflow): " << hashed_value << endl;
    cout << "Nr of words: " << count_words << endl;
    cout << "Distinct words: " << ht.get_distict_words() << endl;
    cout << "Time: Load seed:    " << float( clock_before_hash_table - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash table:    " << float( clock_before_loading_book - clock_before_hash_table ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Load book:    " << float( clock_before_reading - clock_before_loading_book ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Read:    " << float( clock_after_reading - clock_before_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash & Table:    " << float( clock_after_hashing - clock_after_reading ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Total:    " << float( clock_after_hashing - clock_before_seed ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Init hash function:    " << float( clock_after_init_hash_function - clock_after_hashing ) / CLOCKS_PER_SEC << endl;
    cout << "Time: Hash, no table:    " << float( clock_after_hashing_only - clock_after_init_hash_function ) / CLOCKS_PER_SEC << endl;
    for (My_string * word : words)
        delete word;
 }
 // Read the next word from `book`, starting at the character AFTER
 // *reading_progress, and advance *reading_progress to the last character
 // consumed. A word is a maximal run of alphanumeric characters; it is
 // lower-cased and cropped to max_string_length characters.
 // Returns a new My_string owned by the caller; it is empty when the end of
 // the book is reached before any word character.
 // Every character of the word is lower-cased - the first one used to be
 // stored as-is, so "The" and "the" counted as different words - and
 // characters are passed to the <ctype.h> functions as unsigned char, as those
 // functions require (a negative char is undefined behaviour).
 My_string * read_word(const char * book, size_t * reading_progress) {
    char word[max_string_length];
    size_t word_length = 0;
    while (book[*reading_progress+1] != '\0') {
        (*reading_progress)++;
        const unsigned char c = (unsigned char)book[*reading_progress];
        if (isalnum(c)) {
            if (word_length != max_string_length) { // crop words longer than the max_string_length
                word[word_length] = (char)tolower(c);
                word_length++;
            }
        } else if (word_length > 0) {
            break; // the first non-word character after a word ends it
        }
    }
    return new My_string(word, word_length);
 }
--- a/general_library.cpp
+++ b/general_library.cpp
@ -0,0 +1,245 @@
 #include "general_library.hpp"
 // Multiplicative inverse of a modulo n, computed with the extended Euclidean algorithm.
 // https://en.wikipedia.org/wiki/Extended_Euclidean_algorithm#Modular_integers
 // Throws std::runtime_error when a has no inverse modulo n (gcd(a, n) > 1).
 uint32_t multiplicative_inverse(int a, int n) {
    int previous_t = 0, current_t = 1;
    int previous_r = n, current_r = a;
    while (current_r != 0) {
        const int quotient = previous_r/current_r;
        const int next_t = previous_t - quotient*current_t;
        const int next_r = previous_r - quotient*current_r;
        previous_t = current_t;
        current_t = next_t;
        previous_r = current_r;
        current_r = next_r;
    }
    // previous_r now holds gcd(a, n)
    if (previous_r > 1)
        throw std::runtime_error("Tried to inverse a noninvertible element!");
    // map a negative coefficient into the range 0 .. n-1
    return previous_t < 0 ? previous_t + n : previous_t;
 }
 // https://stackoverflow.com/questions/18620942/find-the-smallest-period-of-input-string-in-on
 // Failure table of the Knuth-Morris-Pratt algorithm: lps[i] is the length of
 // the longest proper prefix of pat[0..i] that is also a suffix of pat[0..i].
 // Returns an empty table for m <= 0.
 std::vector<int> calculateLPS(const char * pat, int m) {
    std::vector<int> lps(m > 0 ? m : 0, 0);
    int len = 0; // length of the border that is currently being extended
    int i = 1;
    while (i < m) {
        if (pat[i] == pat[len]) {
            len++;
            lps[i] = len;
            i++;
        }
        else {
            if (len != 0) {
                // fall back to the next shorter border and retry the same i
                len = lps[len - 1];
            }
            else {
                lps[i] = len;
                i++;
            }
        }
    }
    return lps;
 }
 // calculates the length of the shortest period, i.e. the smallest p >= 1 with
 // pattern[i] == pattern[i+p] for all valid i. Returns 0 for m <= 0.
 // The shortest period equals m minus the longest border of the whole pattern.
 // The previous loop, which repeatedly hopped back by lps[i], returned 3 for
 // "aabaaab" although its shortest period is 4, and indexed lps[-1] for m == 0.
 int len_of_shortest_period (const char * pattern, int m) {
    if (m <= 0)
        return 0;
    const std::vector<int> lps = calculateLPS(pattern, m);
    return m - lps[m-1];
 }
 // SECTION: Functions related to calculating with polynomials in Z2[x]
 // Table of one polynomial over Z2 per degree 1..31, encoded as bit masks:
 // bit i is the coefficient of x^i. Entry [k-1] is the polynomial of degree k
 // and is used as the initial modulus by get_random_irreducible_polynomial_in_Z2.
 // The per-entry comments state that each polynomial is irreducible; the line
 // format matches the output of generate_initial_irreducible_polynomials.sage
 // (presumably the source of the table - confirm).
 uint32_t irreducible_polynomials[] {
    0b11,                              // irreducible polynomial of degree 1
    0b111,                             // irreducible polynomial of degree 2
    0b1011,                            // irreducible polynomial of degree 3
    0b10011,                           // irreducible polynomial of degree 4
    0b100101,                          // irreducible polynomial of degree 5
    0b1011011,                         // irreducible polynomial of degree 6
    0b10000011,                        // irreducible polynomial of degree 7
    0b100011101,                       // irreducible polynomial of degree 8
    0b1000010001,                      // irreducible polynomial of degree 9
    0b10001101111,                     // irreducible polynomial of degree 10
    0b100000000101,                    // irreducible polynomial of degree 11
    0b1000011101011,                   // irreducible polynomial of degree 12
    0b10000000011011,                  // irreducible polynomial of degree 13
    0b100000010101001,                 // irreducible polynomial of degree 14
    0b1000000000110101,                // irreducible polynomial of degree 15
    0b10000000000101101,               // irreducible polynomial of degree 16
    0b100000000000001001,              // irreducible polynomial of degree 17
    0b1000001010000000011,             // irreducible polynomial of degree 18
    0b10000000000000100111,            // irreducible polynomial of degree 19
    0b100000000011011110011,           // irreducible polynomial of degree 20
    0b1000000000000001100101,          // irreducible polynomial of degree 21
    0b10000000001111101100001,         // irreducible polynomial of degree 22
    0b100000000000000000100001,        // irreducible polynomial of degree 23
    0b1000000011110011010101001,       // irreducible polynomial of degree 24
    0b10000000000000000101000101,      // irreducible polynomial of degree 25
    0b100000000000100010111010011,     // irreducible polynomial of degree 26
    0b1000000000000001011010101101,    // irreducible polynomial of degree 27
    0b10000000000000010000011100101,   // irreducible polynomial of degree 28
    0b100000000000000000000000000101,  // irreducible polynomial of degree 29
    0b1000000000000110010100010101111, // irreducible polynomial of degree 30
    0b10000000000000000000000000001001 // irreducible polynomial of degree 31
 };
 // Degree of a polynomial over Z2 given as a bit mask (bit i = coefficient of x^i).
 // Precondition: polynomial != 0 (__builtin_clz is undefined for 0).
 size_t degree (uint32_t polynomial) {
    return 31 - __builtin_clz(polynomial);
 }
 // Returns q1*q2 mod p for polynomials over Z2.
 // q1 may have at most the degree of p, otherwise std::logic_error is thrown;
 // q2 may have any degree. p must be nonzero and of degree 31 or less.
 // A zero factor yields 0 (this used to reach degree(0), which is undefined).
 uint32_t multiply_modulo_polynomials_in_Z2 (uint32_t q1, uint32_t q2, uint32_t p) {
    if (q1 == 0 || q2 == 0)
        return 0;
    const size_t p_degree = degree(p);
    const size_t q1_degree = degree(q1);
    if (q1_degree > p_degree)
        throw std::logic_error("We only support multiply-modulo whenever the multiplied polynomials are initially at most the same degree as the modulo polynomial.");
    if (q1_degree == p_degree)
        q1 ^= p;
    // Shift-and-add: `term` is q1 * x^i mod p for the bit i of q2 under
    // inspection. It always has a degree below p_degree, so after one shift at
    // most the bit p_degree can be set, and it is cleared by adding p.
    uint32_t sum = 0;
    uint32_t term = q1;
    for (uint32_t rest = q2; rest != 0; rest >>= 1) {
        if (rest & 1)
            sum ^= term;
        term <<= 1;
        if ((term >> p_degree) & 1)
            term ^= p;
    }
    return sum;
 }
 // Returns q^exp mod p for polynomials over Z2 by square-and-multiply.
 // q^0 is 1. q must have at most the degree of p (see
 // multiply_modulo_polynomials_in_Z2, which throws std::logic_error otherwise).
 uint32_t polynomial_power_in_Z2(uint32_t q, uint32_t exp, uint32_t p) {
    if (exp == 0)
        return 1;
    if (q == 0)
        return 0;
    if (degree(q) == degree(p))
        q ^= p;
    uint32_t res = 1;
    uint32_t base = q; // q^(2^i) for the bit i of exp under inspection
    for (;;) {
        if (exp & 1)
            res = multiply_modulo_polynomials_in_Z2(res, base, p);
        exp >>= 1;
        if (exp == 0)
            break; // every set bit has been consumed (the old loop looked one bit too far)
        base = multiply_modulo_polynomials_in_Z2(base, base, p);
    }
    return res;
 }
 // Bring the (m x n)-matrix A over Z2 into reduced row echelon form, in place.
 // Row i is A[i]; column j is bit j of the row. Bits at positions >= n are left untouched.
 // Throws std::logic_error when m > 31 or n > 32.
 // Gauss-Jordan elimination: every pivot is cleared from ALL other rows as
 // soon as it is found. The previous separate back substitution assumed that
 // the pivot of row i sits in column i and left rank-deficient matrices only
 // partly reduced.
 // https://en.wikipedia.org/wiki/Gaussian_elimination#Pseudocode
 void rref_Z2(std::vector<std::bitset<32>> &A, size_t m, size_t n) {
    if (m > 31 || n > 32)
        throw std::logic_error("We only support rref_Z2 for up to a (31x32)-matrix.");
    size_t h = 0; // row that receives the next pivot
    for (size_t k = 0; k < n && h < m; k++) { // k: pivot column candidate
        // find the first row at or below h with a 1 in column k
        size_t pivot_row = h;
        while (pivot_row < m && !A[pivot_row][k])
            pivot_row++;
        if (pivot_row == m)
            continue; // no pivot in this column, pass to the next column
        const std::bitset<32> tmp = A[pivot_row];
        A[pivot_row] = A[h];
        A[h] = tmp;
        // Clear column k in every other row. Row h is zero in all columns
        // before k, so only the columns from k on need to be combined.
        for (size_t i = 0; i < m; i++) {
            if (i == h || !A[i][k])
                continue;
            for (size_t j = k; j < n; j++)
                A[i][j] = A[i][j] ^ A[h][j];
        }
        h++;
    }
 }
 // Derive a monic polynomial of degree k over Z2 from a random element gamma
 // of GF(2^k): the powers gamma^0 .. gamma^k are written as the columns of a
 // k x (k+1) matrix, which is row reduced to obtain the coefficients of a
 // linear relation between them.
 // Throws std::logic_error unless 1 <= k <= 31.
 // NOTE(review): the relation is only unique when the first k columns are
 // linearly independent; for an unlucky gamma (e.g. one from a proper
 // subfield) the returned polynomial is presumably not irreducible - confirm
 // whether callers need a retry/irreducibility check.
 // NOTE(review): the generator is reseeded with the current time on every
 // call, so calls within the same second pick the same gamma.
 uint32_t get_random_irreducible_polynomial_in_Z2 (size_t k) {
    if (k > 31)
        throw std::logic_error("We only support polynomials of degree 31 or less.");
    if (k == 0)
        throw std::logic_error("We only support polynomials of degree 1 or more.");
    uint32_t init_p = irreducible_polynomials[k-1];
    if (k == 1)
        return init_p; // GF(2)\GF(2) is empty: there is no gamma to draw (the modulus below would be 0)
    srand(time(0));
    // gamma in GF(2^k)\GF(2): the elements of GF(2^k) are the polynomials of
    // degree below k, i.e. the values 0 .. 2^k-1, and GF(2) is {0, 1}. The old
    // range reached up to 2^(k+1)-1 and shifted by 32 bits for k == 31.
    uint32_t gamma = (rand() % (((uint32_t)1 << k) - 2)) + 2;
    uint32_t gamma_pow[32]; // k+1 <= 32 entries are used
    for (size_t i = 0; i <= k; i++)
        gamma_pow[i] = polynomial_power_in_Z2(gamma, i, init_p);
    // Create an array of the polynomials in gamma_pow, and transpose it at the same time:
    // column k-j of A holds the coefficients of gamma^j, row i the coefficient of x^i.
    std::vector<std::bitset<32>> A(k); // NOTE: That 32 > 31 >= k
    for (size_t i = 0; i < k; i++) {
        for (size_t j = 0; j <= k; j++) {
            A[i][k-j] = gamma_pow[j] & ((uint32_t)1<<i);
        }
    }
    rref_Z2(A, k, k+1);
    // the last column of the reduced matrix holds the low coefficients;
    // the leading coefficient is 1
    std::bitset<32> bp;
    for (size_t i = 0; i < k; i++) {
        bp[i] = A[i][k];
    }
    bp[k] = 1;
    uint32_t p = (uint32_t)bp.to_ulong();
    return p;
 }
--- a/general_library.hpp
+++ b/general_library.hpp
@ -0,0 +1,17 @@
 #ifndef GENERAL_LIBRARY_H
 #define GENERAL_LIBRARY_H
 #include <stdlib.h>
 #include <stdint.h>
 #include <stdexcept>
 #include <vector>
 #include <bitset>
 #include <iostream>
 // Multiplicative inverse of a modulo n (extended Euclidean algorithm).
 // Throws std::runtime_error when a is not invertible modulo n.
 uint32_t multiplicative_inverse(int a, int n);
 // Length of the shortest period of the first m characters of pattern.
 int len_of_shortest_period(const char * pattern, int m);
 // SECTION: Functions related to calculating with polynomials in Z2[x]
 // Returns a polynomial of degree k as a bit mask (bit i = coefficient of x^i).
 // Throws std::logic_error when k > 31.
 uint32_t get_random_irreducible_polynomial_in_Z2 (size_t k);
 #endif
--- a/generate_initial_irreducible_polynomials.sage
+++ b/generate_initial_irreducible_polynomials.sage
@ -0,0 +1,12 @@
 # Prints one binary literal per degree 1..max_k, each followed by a comma and an
 # aligned comment; presumably the output is pasted into the C++ table of
 # initial irreducible polynomials.
 F = GF(2)
 PR = PolynomialRing(F, 'x')
 max_k = 31
 for degree in range(1, max_k+1):
    # coefficients(sparse=False) lists the lowest degree first; reverse it so
    # that the most significant bit is written first
    bits = ''.join(str(c) for c in reversed(PR.irreducible_element(degree).coefficients(sparse=False)))
    # Pad after the comma so that the trailing comments line up
    literal = f'0b{bits},' + ' '*(max_k-degree)
    print(f'    {literal}// irreducible polynomial of degree {degree}')
--- a/generate_random_irreducible_polynomial.sage
+++ b/generate_random_irreducible_polynomial.sage
@ -0,0 +1,96 @@
 # Prototype: derive a degree-k polynomial over GF(2) from a random element of
 # GF(2^k) and check whether it is irreducible.
 k = 31
 F = GF(2)
 E = GF(2^k)
 PR = PolynomialRing(F, 'x')
 p = PR.irreducible_element(k)
 # Draw random elements until one lies outside the prime field GF(2)
 while(True):
    gamma = E.random_element()
    if gamma not in F:
        break
 # gamma = PR('x^3+x')
 # print('0b'+ ''.join(map(str, gamma.coefficients(sparse=False)[::-1])))
 # The powers gamma^0, ..., gamma^k, each reduced modulo p
 eqs = [PR(gamma)^i % p for i in range(k+1)]
 for eq in eqs:
    print(eq)
 print()
 # Turn every power into its coefficient list (lowest degree first), padded
 # with zeros so that every list has exactly k entries
 eqs = list(map(lambda eq: eq.coefficients(sparse=False) + [0]*(k-eq.degree()-1), eqs))
 for eq in eqs:
    print(eq)
 print()
 # One row per power, highest power (gamma^k) first
 eqs = matrix(eqs[::-1])
 print(eqs)
 print()
 # After transposing, every column is one power and every row one coefficient index
 eqs = eqs.transpose()
 print(eqs)
 print()
 rref = eqs.rref()
 print(rref)
 # The last column of the reduced matrix gives the low coefficients; the
 # appended 1 is the coefficient of x^k
 irrpol = PR(rref[:,-1].list() + [1])
 print(irrpol)
 print(irrpol.is_irreducible())
 print()
 # manual rref
 def calc_rref_Z2(A, m, n):
    """Calculate the reduced row echelon form of a (mxn)-matrix over Z2.

    The input matrix is left untouched; a reduced copy is returned.
    The position of every pivot is recorded during the forward elimination, so
    the back substitution also works when some column has no pivot (the
    pivots then no longer sit on the diagonal).
    """
    A = copy(A)
    # calculate row echelon form
    # https://en.wikipedia.org/wiki/Gaussian_elimination#Pseudocode
    pivots = [] # (row, column) of every pivot, in the order they were found
    h = 0 # Initialization of the pivot row
    k = 0 # Initialization of the pivot column
    while h < m and k < n:
        # Find the first row at or below h with a 1 in column k
        i_max = next((i for i in range(h, m) if A[i, k] == 1), -1)
        if i_max == -1:
            # No pivot in this column, pass to next column
            k += 1
            continue
        A.swap_rows(i_max, h)
        # Clear column k in all rows below the pivot
        for i in range(h+1, m):
            if A[i, k] != 0:
                A.add_multiple_of_row(i, h, -1)
        pivots.append((h, k))
        # Increase pivot row and column
        h += 1
        k += 1
    # perform back substitution: clear every pivot column above its pivot
    for row, col in pivots:
        for j in range(row):
            if A[j, col] == 1:
                A.add_multiple_of_row(j, row, -1)
    return A
 # Repeat the construction with the hand-written row reduction
 print('Manual RREF:\n')
 rref = calc_rref_Z2(eqs, k, k+1) # cols = rows+1, since we transposed the matrix
 print(rref)
 print()
 # Same read-out as before: last column plus a leading coefficient 1 for x^k
 irrpol = PR(rref[:,-1].list() + [1])
 print(irrpol)
 print(irrpol.is_irreducible())
 print()
 # Binary literal of the polynomial, most significant coefficient first
 print('0b'+ ''.join(map(str, irrpol.coefficients(sparse=False)[::-1])))
--- a/hash_function_library.cpp
+++ b/hash_function_library.cpp
@ -0,0 +1,106 @@
 #include "hash_function_library.hpp"
 // Returns the fingerprint member of Rolling_hash itself, converted to int.
 int Rolling_hash::get_fingerprint() {
    const int current = static_cast<int>(fingerprint);
    return current;
 }
 /**
  * Creates a rolling hash over a window of `length` bytes, all initially zero.
  *
  * @param p       Modulus (prime), must satisfy 0 < p < 2^31.
  * @param length  Window size in bytes; the window holds n = 8*length bits.
  * @throws std::invalid_argument if p is 0.
  * @throws std::overflow_error   if p >= 2^31.
  */
 Rabin_karp::Rabin_karp(uint32_t p, size_t length) : p(p) {
    // Validate before touching any state; p == 0 would divide by zero below
    if (p == 0)
        throw std::invalid_argument("A Rabin-Karp hash function has been initialized with the modulus 0.");
    if (p >= (static_cast<uint32_t>(1) << 31))
        throw std::overflow_error("A Rabin-Karp hash function has been initialized with too large a prime, such that we will encounter overflow errors.");
    // xi = 2^n mod p is the weight of the bit that leaves the window once the
    // window has been shifted by one bit. slide() moves 8 bits per byte, so
    // n = 8*length. It is built up byte by byte to keep every intermediate
    // value below p*256, which fits in 64 bits.
    uint64_t weight = 1 % p;
    for (size_t i = 0; i < length; i++) {
        elements.push(0);
        weight = (weight << 8) % p;
    }
    xi = static_cast<uint32_t>(weight);
 }
 /**
  * Slides the window one byte forward: the oldest byte leaves, `c_in` enters.
  * The fingerprint is updated bit by bit, most significant bit first.
  */
 void Rabin_karp::slide(unsigned char c_in) {
    // A window of length 0 never contains anything, so there is nothing to slide
    if (elements.empty())
        return;
    const unsigned char c_out = elements.front();
    elements.pop();
    elements.push(c_in);
    // The counter must be signed: an unsigned counter never becomes negative,
    // so `i >= 0` would always hold and the loop would never end.
    for (int bit = 7; bit >= 0; bit--) {
        const bool bit_in = ((c_in >> bit) & 1u) != 0;
        const bool bit_out = ((c_out >> bit) & 1u) != 0;
        slide_bit(bit_in, bit_out);
    }
 }
 /**
  * Slides the window one bit forward:
  *     fingerprint <- 2*fingerprint + bit_in - xi*bit_out   (mod p)
  */
 void Rabin_karp::slide_bit(bool bit_in, bool bit_out) {
    // Work in 64 bits so that neither the doubling nor the additions overflow
    uint64_t shifted = (static_cast<uint64_t>(fingerprint) << 1) + (bit_in ? 1 : 0);
    // Subtracting xi modulo p is the same as adding p - xi, which keeps the
    // unsigned value from wrapping around below zero
    if (bit_out)
        shifted += p - (xi % p);
    fingerprint = static_cast<uint32_t>(shifted % p);
 }
 Polynomial_fingerprint::Polynomial_fingerprint(int32_t p, int32_t r) : p(p), r(r) {}
 /**
  * Appends `c` to the hashed sequence:
  *     fingerprint <- fingerprint + c * r^e  (mod p),  e = size() mod (p-1)
  *
  * The power is computed with modular square-and-multiply instead of the
  * floating point pow(), which loses precision and overflows the integer cast
  * for all but the smallest exponents.
  */
 void Polynomial_fingerprint::push(unsigned char c) {
    const int64_t modulus = p;
    const auto pow_mod = [modulus](int64_t base, uint64_t exponent) {
        int64_t result = 1 % modulus;
        base = ((base % modulus) + modulus) % modulus;
        while (exponent > 0) {
            if (exponent & 1)
                result = result * base % modulus;
            base = base * base % modulus;
            exponent >>= 1;
        }
        return result;
    };
    // The exponent is reduced modulo p-1 (Fermat's little theorem, p prime)
    const uint64_t exp = elements.size() % (p-1);
    fingerprint = static_cast<int32_t>((fingerprint + c*pow_mod(r, exp)) % modulus);
    elements.push(c);
 }
 /**
  * Removes the `i` oldest elements from the hashed sequence: their contribution
  * is subtracted and the remainder is divided by r^i (all modulo p).
  *
  * @throws std::out_of_range if more elements are removed than are stored.
  *
  * NOTE(review): the removed element number ii is weighted with r^(ii+1) here,
  * whereas push() weights the first element with r^0 — confirm which of the two
  * conventions is the intended one.
  */
 void Polynomial_fingerprint::shift(size_t i) {
    if (i > elements.size())
        throw std::out_of_range("Cannot shift past the end of the hashed sequence.");
    const int64_t modulus = p;
    // Modular square-and-multiply; the floating point pow() overflows quickly
    const auto pow_mod = [modulus](int64_t base, uint64_t exponent) {
        int64_t result = 1 % modulus;
        base = ((base % modulus) + modulus) % modulus;
        while (exponent > 0) {
            if (exponent & 1)
                result = result * base % modulus;
            base = base * base % modulus;
            exponent >>= 1;
        }
        return result;
    };
    int64_t subtract_fingerprint = 0;
    for (size_t ii = 0; ii < i; ii++) {
        const unsigned char c = elements.front();
        elements.pop();
        const uint64_t exp = (ii+1) % (p-1);
        subtract_fingerprint = (subtract_fingerprint + c*pow_mod(r, exp)) % modulus;
    }
    // Normalise the difference so that it is never negative
    const int64_t remaining = ((fingerprint - subtract_fingerprint) % modulus + modulus) % modulus;
    const int64_t inverse = multiplicative_inverse(static_cast<int>(pow_mod(r, i)), p);
    fingerprint = static_cast<int32_t>(remaining * inverse % modulus);
 }
 /**
  * Preprocesses the pattern `P`.
  *
  * 1. Stores the shortest period of every prefix of length 2^i (2^i < |P|) and
  *    of the full pattern in `shortest_periods`.
  * 2. Pushes the pattern character by character and stores the fingerprint of
  *    every prefix whose length is a power of two or one of the periods from
  *    step 1, and of the full pattern. `prehashed_indices` maps the prefix
  *    length to the position of its fingerprint in `prehashed_values`.
  *
  * Every character is pushed, also at the positions where a fingerprint is
  * recorded, and the next power of two is advanced after each hit.
  */
 Porat_porat_polynomial_fingerprint::Porat_porat_polynomial_fingerprint(std::string P, int32_t p, int32_t r) : p(p), r(r) {
    const char * P_c_str = P.c_str();
    const size_t pattern_length = P.length();
    // Calculate the shortest periods for all prefixes of length 2^i (and the full pattern)
    for (size_t prefix_length = 1; prefix_length < pattern_length; prefix_length <<= 1)
        shortest_periods.push_back(len_of_shortest_period(P_c_str, prefix_length));
    shortest_periods.push_back(len_of_shortest_period(P_c_str, pattern_length));
    // Stores the current fingerprint for a prefix length unless it is already known
    const auto remember_prefix = [this](size_t prefix_length) {
        if (prehashed_indices.find(prefix_length) != prehashed_indices.end())
            return;
        prehashed_values.push_back(get_fingerprint());
        prehashed_indices[prefix_length] = prehashed_values.size()-1;
    };
    // Calculate the fingerprints of all prefixes of length 2^i, and of the shortest periods found before
    size_t next_2_exponent = 1;
    size_t shortest_period_index = 0;
    for (size_t i = 0; i < pattern_length; i++) {
        // Before P[i] is pushed, the fingerprint covers the prefix of length i
        bool is_checkpoint = false;
        if (i == next_2_exponent) {
            is_checkpoint = true;
            next_2_exponent <<= 1;
        }
        // Several prefixes can share a period, so skip over all entries <= i
        while (shortest_period_index < shortest_periods.size() && shortest_periods[shortest_period_index] <= i) {
            if (shortest_periods[shortest_period_index] == i)
                is_checkpoint = true;
            shortest_period_index++;
        }
        if (is_checkpoint)
            remember_prefix(i);
        push(P[i]);
    }
    // We have now pushed the entire pattern
    prehashed_values.push_back(get_fingerprint());
    prehashed_indices[pattern_length] = prehashed_values.size()-1;
    // Save the length of the pattern before we throw the pattern away
    m = pattern_length;
 }
 // Placeholder: currently does nothing, so pushing `c` leaves the fingerprint
 // and the stored elements unchanged.
 void Porat_porat_polynomial_fingerprint::push(unsigned char c){
    // TODO
 }
 // Placeholder: currently does nothing, so shifting by `i` leaves the
 // fingerprint and the stored elements unchanged.
 void Porat_porat_polynomial_fingerprint::shift(size_t i){
    // TODO
 }
--- a/hash_function_library.hpp
+++ b/hash_function_library.hpp
@ -0,0 +1,108 @@
 #ifndef HASH_LIBRARY_H
 #define HASH_LIBRARY_H
 #include <stdlib.h>
 #include <stdint.h>
 #include <math.h>
 #include <string>
 #include <queue>
 #include <stdexcept>
 #include <map>
 #include "general_library.hpp"
 // Common interface of the rolling hash functions in this library.
 class Rolling_hash {
    public:
        // Polymorphic base class: the destructor has to be virtual so that a
        // derived object can be destroyed through a Rolling_hash pointer
        virtual ~Rolling_hash() = default;
        // pushes element
        virtual void push(unsigned char c);
        // shifts i indices
        // the hash function should already know the values
        virtual void shift(size_t i);
        // replaces the oldest element of the window by `c`
        virtual void slide(unsigned char c);
        // returns the fingerprint stored in this base class
        int get_fingerprint();
    private:
        // initialised, so that get_fingerprint() never reads an indeterminate value
        int fingerprint = 0;
 };
 // Rolling hash over a fixed-size window of bytes, updated bit by bit.
 // NOTE(review): `class Rabin_karp : Rolling_hash` inherits privately, so
 // Rolling_hash::get_fingerprint() cannot be called from outside — confirm
 // whether public inheritance was intended.
 class Rabin_karp : Rolling_hash {
    // Hash function: sum_{i=1}^n x_i*2^{n-i} mod p
    // With X being a binary string
    public:
        // `p` is the prime modulus. It has to be below 2^31; the constructor
        // throws std::overflow_error otherwise. `length` is the number of
        // bytes in the window, which starts out filled with zero bytes.
        Rabin_karp(uint32_t p, size_t length);
        // Removes the oldest byte from the window and appends `c`
        void slide(unsigned char c);
    private:
        // Updates the fingerprint for a single bit entering and leaving the window
        void slide_bit(bool bit_in, bool bit_out);
        std::queue<unsigned char> elements; // the bytes currently in the window
        // NOTE(review): this member is separate from the private
        // Rolling_hash::fingerprint that get_fingerprint() returns.
        uint32_t fingerprint = 0;
        uint32_t xi; // 2^n mod p
        uint32_t p; // prime
 };
 // Polynomial fingerprint of a growing/shrinking sequence of bytes.
 // NOTE(review): the inheritance is private (class default), so
 // Rolling_hash::get_fingerprint() is not reachable from outside — confirm intended.
 class Polynomial_fingerprint : Rolling_hash {
    // Hash function: sum_{i=1}^l s_i*r^i mod p
    // r in F_p
    // TODO: Add some overflow warning
    // TODO: Untested
    public:
        // `p` is the prime modulus, `r` the base of the polynomial
        Polynomial_fingerprint(int32_t p, int32_t r);
        // Appends `c` to the sequence and adds its term to the fingerprint
        void push(unsigned char c);
        // Removes the `i` oldest elements from the sequence and the fingerprint
        void shift(size_t i);
    private:
        std::queue<unsigned char> elements; // the bytes currently covered by the fingerprint
        // NOTE(review): this member is separate from the private
        // Rolling_hash::fingerprint that get_fingerprint() returns.
        int32_t fingerprint = 0;
        int32_t p; // prime
        int32_t r; // r in F_p
 };
 // Polynomial fingerprint that additionally keeps precomputed data about a
 // pattern: the shortest periods of its prefixes and the fingerprints of
 // selected prefixes.
 class Porat_porat_polynomial_fingerprint : Rolling_hash {
    // Hash function: sum_{i=1}^l s_i*r^i mod p
    // r in F_p
    // TODO: Add some overflow warning
    // TODO: Untested
    public:
        // Preprocesses the pattern `P`; `p` is the prime modulus and `r` the base
        Porat_porat_polynomial_fingerprint(std::string P, int32_t p, int32_t r);
        // Both are still empty placeholders in hash_function_library.cpp
        void push(unsigned char c);
        void shift(size_t i);
        // NOTE(review): no definition of the following three functions is
        // visible in hash_function_library.cpp.
        bool should_children_be_killed();
        int get_generation();
        int get_child();
    protected:
        // TODO: Optimize the code such that we don't copy the prehashed values, but instead share it between all instances.
        //       I guess we would have to store it in a separate object, and then pass a reference to it around (to avoid it getting destroyed early).
        // Takes already computed tables by value.
        // NOTE(review): no definition is visible in hash_function_library.cpp.
        Porat_porat_polynomial_fingerprint(int32_t p, int32_t r, std::vector<int32_t> prehashed_values, std::vector<unsigned int> shortest_periods, std::map<unsigned int, unsigned int> prehashed_indices);
    private:
        std::queue<unsigned char> elements;
        // NOTE(review): separate from the private Rolling_hash::fingerprint
        // that get_fingerprint() returns.
        int32_t fingerprint = 0;
        int32_t p; // prime
        int32_t r; // r in F_p
        size_t m; // pattern length
        std::vector<int32_t> prehashed_values; // fingerprints of selected pattern prefixes
        std::vector<unsigned int> shortest_periods; // shortest periods of the prefixes of length 2^i and of the full pattern
        std::map<unsigned int, unsigned int> prehashed_indices; // prefix length -> index into prehashed_values
 };
        /* void push(const char * cs, size_t n) { */
        /*     for (size_t i = 0; i < n; i++) */
        /*         push(cs[i]); */
        /* } */
        /* void push(std::string s) { */
        /*     for (char c : s) */
        /*         push(c); */
        /* } */
 #endif
--- a/multiply_polynomials_modulo_polynomial.sage
+++ b/multiply_polynomials_modulo_polynomial.sage
@ -0,0 +1,68 @@
 import math
 # Test data: a random polynomial gamma and the reference value of
 # gamma^exp mod p as computed by Sage itself
 k = 31
 F = GF(2)
 var = 'x'
 PR = PolynomialRing(F, var)
 p = PR.irreducible_element(k) # the modulus
 gamma = PR.random_element(k)
 exp = 10
 target = gamma^exp % p # expected result of the hand-written routines below
 def polynomial_power_in_Z2(q, exp, p, var):
    """Return q^exp modulo p, using exp-1 successive multiplications.

    q may have the same degree as p; it is then reduced by adding p once.
    The result is always an element of PR, also for exp == 0.
    """
    if exp == 0:
        return PR(1)
    if q.degree() == p.degree():
        q += p
    res = q
    for _ in range(exp-1):
        res = multiply_polynomials_in_Z2(res, q, p, var)
    return res
 def polynomial_power_in_Z2_V2(q, exp, p, var):
    """Return q^exp modulo p, using square-and-multiply.

    The bits of exp are processed from the least significant one upwards;
    `square` holds q^(2^i) for the bit currently being looked at. Working on
    the integer directly avoids sizing a table with a floating point logarithm.
    The result is always an element of PR, also for exp == 0.
    """
    if exp == 0:
        return PR(1)
    if q.degree() == p.degree():
        q += p
    res = PR(1)
    square = q
    remaining = exp
    while remaining > 0:
        if remaining % 2 == 1:
            res = multiply_polynomials_in_Z2(res, square, p, var)
        remaining //= 2
        # Only square while there are bits left to process
        if remaining > 0:
            square = multiply_polynomials_in_Z2(square, square, p, var)
    return res
 def multiply_polynomials_in_Z2(q1, q2, p, var):
    """Return q1*q2 modulo p using only shifts and additions.

    shifted[i] holds q1*x^i modulo p; the product is the sum of shifted[i] over
    the exponents i that occur in q2. A zero q2 yields the zero polynomial.
    Raises ValueError if the degree of q1 exceeds the degree of p.
    """
    if q1.degree() > p.degree():
        raise ValueError('Unsupported!')
    if q1.degree() == p.degree():
        q1 += p
    shifted = [q1]
    # range() is empty for the zero polynomial, whose degree is -1
    for i in range(1, q2.degree()+1):
        nxt = shifted[i-1]*PR(var)
        # Multiplying by x raises the degree by one at most, so a single
        # addition of p is enough to reduce it again
        if nxt.degree() == p.degree():
            nxt += p
        shifted.append(nxt)
    # Start from PR(0) so that the result is a polynomial even for an empty sum
    return sum((shifted[i] for i in q2.exponents()), PR(0))
 # The three printed polynomials are expected to be identical: Sage's own
 # result first, then the results of the two hand-written routines
 print(target)
 res = polynomial_power_in_Z2(gamma, exp, p, var)
 print(res)
 res = polynomial_power_in_Z2_V2(gamma, exp, p, var)
 print(res)
--- a/porat-porat.cpp
+++ b/porat-porat.cpp
@ -0,0 +1,226 @@
 /* #define NDEBUG */
 #include <stdlib.h>
 #include <string>
 #include <vector>
 #include <iostream>
 #include <map>
 #include <thread>
 #include <math.h>
 #include <string_view>
 #include "hash_function_library.hpp"
 // Initialization of constants
 int p = 7919; // the prime for our hash function
 int r = 11; // random int in F_p
 char T[] = "abcabcabcdabc"; // text
 /* char P[] = "abcabc"; // pattern */
 char P[] = "abcabcabcabcabcabcddddddddddddddddddabc"; // pattern
 // Filled by main():
 std::vector<long> prehashed_values; // fingerprints of the period prefixes of P
 std::vector<int> shortest_periods; // shortest period of every examined prefix of P
 std::map<int, int> prehashed_indices; // period length -> index into prehashed_values
 // https://stackoverflow.com/questions/18620942/find-the-smallest-period-of-input-string-in-on
 // BEGIN stolen code
 // Computes the prefix function ("longest proper prefix which is also a
 // suffix") of the first m characters of pat: entry i is the length of the
 // longest proper border of pat[0..i]. Returns an empty vector for m <= 0.
 std::vector<int> calculateLPS(char * pat, int m) {
    if (m <= 0)
        return {};
    std::vector<int> lps(m, 0);
    int len = 0; // length of the border that is currently being extended
    int i = 1;
    while (i < m) {
        if (pat[i] == pat[len]) {
            len++;
            lps[i] = len;
            i++;
        }
        else if (len != 0) {
            // fall back to the next shorter border and try again
            len = lps[len - 1];
        }
        else {
            lps[i] = 0;
            i++;
        }
    }
    return lps;
 }
 // calculates the length of the shortest period
 // The shortest period of a string of length m equals m minus the length of
 // its longest proper border. Repeatedly walking back through the table, as
 // the previous implementation did, is not equivalent: for "abaab" it yields
 // 2, although the shortest period is 3. Returns 0 for m <= 0.
 int len_of_shortest_period (char * pattern, int m) {
    if (m <= 0)
        return 0;
    const std::vector<int> lps = calculateLPS(pattern, m);
    return m - lps[m-1];
 }
 // END
 // Keeps the polynomial fingerprint sum_{j=1}^{l} c_j * r^j mod p of the
 // characters seen so far, using the global prime p and base r.
 class porat_process {
    // TODO: use a different hash function. This one is BAD
    public:
        // we use the polynomial fingerprint
        // Appends `c`: the j-th character is weighted with r^j.
        void increment_hash (char c) {
            prev_pow = prev_pow*r % p;
            // Go through unsigned char so that characters above 127 cannot
            // make the fingerprint negative
            hash = (hash + (long)(unsigned char)c*prev_pow) % p;
            l++;
        }
        // Removes the first i characters.
        void subtract_hash (long pre_fingerprint, int i) {
            // i is the number of removed elements
            // pre_fingerprint is the fingerprint of those previous elements
            // The fingerprint is only known modulo p, so dividing by r^i has
            // to be a multiplication with the modular inverse of r^i. As p is
            // prime, that inverse is (r^i)^(p-2) mod p (Fermat).
            const long inverse = mod_pow(mod_pow(r, i, p), p-2, p);
            hash = ((hash - pre_fingerprint) % p + p) % p * inverse % p;
            prev_pow = prev_pow * inverse % p;
            l -= i;
            // TODO: untested, especially prev_pow
        }
        // True exactly when the number of hashed characters reaches the next
        // power of two; the threshold is doubled afterwards.
        bool should_spawn_child() {
            if (l == next_i_squared) {
                next_i_squared <<= 1;
                return true;
            }
            else
                return false;
        }
        long get_fingerprint() {
            return hash;
        }
    private:
        // base^exponent mod modulus by square-and-multiply
        static long mod_pow(long base, long exponent, long modulus) {
            long result = 1 % modulus;
            base = ((base % modulus) + modulus) % modulus;
            while (exponent > 0) {
                if (exponent & 1)
                    result = result * base % modulus;
                base = base * base % modulus;
                exponent >>= 1;
            }
            return result;
        }
        long prev_pow = 1; // r^l mod p
        int l = 0; // number of hashed characters
        int next_i_squared = 1; // next power of two at which a child is spawned
        long hash = 0;
 };
 // Writes `comment` followed by every entry of `m` as "key = value; " and a
 // final newline to standard output.
 void print_map(std::string_view comment, const std::map<int, int>& m)
 {
    std::cout << comment;
    for (auto entry = m.begin(); entry != m.end(); ++entry)
        std::cout << entry->first << " = " << entry->second << "; ";
    std::cout << '\n';
 }
 // Writes `comment` followed by the elements of `m` as "[a, b, ]" and a
 // newline to standard output; every element is followed by ", ".
 void print_vector(std::string_view comment, const std::vector<int>& m)
 {
    std::cout << comment << '[';
    for (std::size_t position = 0; position < m.size(); ++position)
        std::cout << m[position] << ", ";
    std::cout << ']' << '\n';
 }
 // Same output format as print_vector, for a vector of long values.
 void print_vector_long(std::string_view comment, const std::vector<long>& m)
 {
    std::cout << comment << '[';
    auto current = m.begin();
    while (current != m.end()) {
        std::cout << *current << ", ";
        ++current;
    }
    std::cout << ']' << '\n';
 }
 int main() {
    int n = sizeof(T)/sizeof(char) - 1;
    int m = sizeof(P)/sizeof(char) - 1;
    {
        int i = 1;
        while (i < m) {
            // calculate shortest period length
            int period = len_of_shortest_period(P, i);
            shortest_periods.push_back(period);
            // calculate fingerprint of period
            if (!prehashed_indices.contains(period)) {
                porat_process process;
                for (int ii = 0; ii < period; ii++){
                    std::cout << P[ii];
                    process.increment_hash(P[ii]);
                }
                /* prehashed_indices[period] = process.get_fingerprint(); */
                prehashed_values.push_back(process.get_fingerprint());
                std::cout << period << " " << prehashed_values.size() << std::endl;
                prehashed_indices[period] = prehashed_values.size()-1;
            }
            i <<= 1;
        }
        if (i != m) { // so i>m, which means we skipped exactly m
            // calculate shortest period length
            int period = len_of_shortest_period(P, m);
            shortest_periods.push_back(period);
            // calculate fingerprint of period
            if (!prehashed_indices.contains(period)) {
                porat_process process;
                std::cout << "[";
                for (int ii = 0; ii < period; ii++) {
                    std::cout << P[ii];
                    process.increment_hash(P[ii]);
                }
                std::cout << "]\n";
                prehashed_values.push_back(process.get_fingerprint());
                std::cout << period << " " << prehashed_values.size() << std::endl;
                prehashed_indices[period] = prehashed_values.size()-1;
            }
            /* // calculate fingerprint of phi(P_{2^i}) */
            /* while (ii < m) { */
            /*     process.increment_hash(P[ii]); */
            /*     ii++; */
            /* } */
            /* prehashed_values.push_back(process.get_fingerprint()); */
        }
    }
    {
        std::cout << P << std::endl;
        int i = 0;
        while ((1 << i) < m) {
            std::cout << "pattern: ";
            for (int ii = 0; ii < (1 << i); ii++)
                std::cout << P[ii];
            std::cout << std::endl;
            std::cout << "period:  ";
            for (int ii = 0; ii < shortest_periods[i]; ii++)
                std::cout << P[ii];
            std::cout << std::endl;
            std::cout << "|prefix_{P_" << (1 << i) << "}| = " << shortest_periods[i] << std::endl;
            std::cout << prehashed_values[prehashed_indices[shortest_periods[i]]] << std::endl;
            i++;
        }
        if ((1 << i) != m) { // so i>m, which means we skipped exactly m
            std::cout << "pattern: ";
            for (int ii = 0; ii < m; ii++)
                std::cout << P[ii];
            std::cout << std::endl;
            std::cout << "period:  ";
            for (int ii = 0; ii < shortest_periods[i]; ii++)
                std::cout << P[ii];
            std::cout << std::endl;
            std::cout << "|prefix_{P_" << m << "}| = " << shortest_periods[i] << std::endl;
            std::cout << prehashed_values[prehashed_indices[shortest_periods[i]]] << std::endl;
            std::cout << prehashed_values[0] << std::endl;
            std::cout << prehashed_values[1] << std::endl;
            std::cout << prehashed_values[2] << std::endl;
            std::cout << prehashed_values[3] << std::endl;
            std::cout << prehashed_values[4] << std::endl;
        }
    }
    print_map("Indices map: ", prehashed_indices);
    print_vector_long("Values vector: ", prehashed_values);
    print_vector("Periods vector: ", shortest_periods);
    return EXIT_SUCCESS;
 }
--- a/BIN
+++ b/BIN
--- a/simple_string_matching.cpp
+++ b/simple_string_matching.cpp
@ -0,0 +1,65 @@
 /* #define NDEBUG */
 #include "Rabin_fingerprint.hpp"
 #include "general_library.hpp"
 #include <iostream>
 #include <stdint.h>
 #include <math.h>
 #include <string>
 #include <fstream>
 // Reports a match: prints the start index and the `length` characters of `T`
 // beginning at `index`, enclosed in double quotes.
 void print_match (size_t index, size_t length, std::string &T) {
    std::cout << "Match found at index " << index << " with the text \"";
    const size_t end = index + length;
    for (size_t position = index; position != end; ++position)
        std::cout << T[position];
    std::cout << "\"" << std::endl;
 }
 // Searches the text file for the pattern P by comparing Rabin fingerprints of
 // a sliding window with the fingerprint of the pattern. A reported match
 // means that the fingerprints are equal; the characters are not compared.
 int main() {
    /* std::ifstream ifs("books/the_complete_works_of_william_shakespeare.txt"); */
    std::ifstream ifs("books/genji_monogatari_english.txt");
    // Without this check a missing file silently results in an empty text
    if (!ifs.is_open()) {
        std::cerr << "Could not open the text file." << std::endl;
        return EXIT_FAILURE;
    }
    std::string T( (std::istreambuf_iterator<char>(ifs) ),
                    (std::istreambuf_iterator<char>() ) );
    /* std::string T = "Hello, this is my test string averylongword is a necessary word to exceed the 32 bit window."; */
    // Test without the modulo polynomial - and two matches
    std::string P = "word";
    // Test with the modulo polynomial
    /* std::string P = "averylongword"; */
    std::cout << "Searching for pattern:" << std::endl;
    std::cout << "    " << P << std::endl;
    /* std::cout << "in text:" << std::endl; */
    /* std::cout << "    " << T << std::endl; */
    std::cout << std::endl;
    /* uint32_t polynomial = pow(2, 30) + pow(2, 2) + 1; // x^31 + x^3 + 1 */
    uint32_t polynomial = get_random_irreducible_polynomial_in_Z2(31);
    /* uint32_t polynomial = 0b11010011100100000111101011110111; */
    // Test without the modulo polynomial
    size_t window_size_in_bits = P.length()*8;
    // A text shorter than the pattern cannot contain it; searching anyway
    // would read past the end of the text
    if (T.length() >= P.length()) {
        // Hash the pattern
        Rabin_fingerprint fP(polynomial, window_size_in_bits);
        for (char c : P)
            fP.push_char(c);
        // Hash the text
        Rabin_fingerprint fT(polynomial, window_size_in_bits);
        for (size_t i = 0; i < P.length(); i++)
            fT.push_char(T[i]);
        if (fT.get_fingerprint() == fP.get_fingerprint())
            print_match(0, P.length(), T);
        // Slide the window one character at a time: T[i] enters, T[i-|P|] leaves
        for (size_t i = P.length(); i < T.length(); i++) {
            fT.slide_char(T[i], T[i-P.length()]);
            if (fT.get_fingerprint() == fP.get_fingerprint())
                print_match(i-P.length()+1, P.length(), T);
        }
    }
    std::cout << std::endl;
    std::cout << "Done!" << std::endl;
    return EXIT_SUCCESS;
 }
--- a/test_rabin_fingerprint.sage
+++ b/test_rabin_fingerprint.sage
@ -0,0 +1,97 @@
 from random import randint
 F = GF(2)
 PR = PolynomialRing(F, 'x')
 k = 31
 P = PR.irreducible_element(k)
 m = 100
 # Test the calculation for moving the left edge of the sliding window:
 # the fingerprint of the first i coefficients equals the fingerprint of all
 # coefficients minus the fingerprint of the remaining ones shifted by x^i.
 # The assertion depends on the split point i only, so it is checked once per
 # split point i = 1, ..., m-1.
 for _ in range(1):
    q = tuple(randint(0, 1) for _ in range(m))
    q_mod_P = PR(q) % P # does not depend on the split point
    for i in range(1, m):
        assert (PR(q[:i]) % P) == q_mod_P - (PR(f'x^{i}')*PR(q[i:]) % P)
 # Moving the right side of the window is as described in the Rabin Fingerprint article
 # Next step (TODO)
 # pattern     = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1,1,1,1,0,0,1,0,0,0,1)
 # period      = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1,1,1,1,0,0,1,0,0,0)
 # m           = len(pattern)
 # s_period    = tuple(list(period)+[0]*(m-len(period)))
 # pattern_1   = (1)
 # period_1    = (1)
 # s_period_1  = tuple(list(period_1)+[0]*(m-len(period_1)))
 # pattern_2   = (1,0)
 # period_2    = (1,0)
 # s_period_2  = tuple(list(period_2)+[0]*(m-len(period_2)))
 # pattern_4   = (1,0,1,1)
 # period_4    = (1,0,1)
 # s_period_4  = tuple(list(period_4)+[0]*(m-len(period_4)))
 # pattern_8   = (1,0,1,1,1,1,0,1)
 # period_8    = (1,0,1,1,1)
 # s_period_8  = tuple(list(period_8)+[0]*(m-len(period_8)))
 # pattern_16  = (1,0,1,1,1,1,0,1,1,0,1,0,1,0,1,1)
 # period_16   = (1,0,1,1,1,1,0,1,1,0,1,0)
 # s_period_16 = tuple(list(period_16)+[0]*(m-len(period_16)))
 # for i in range(len(pattern)-len(pattern_4)-len(period_4)):
 #     assert PR(pattern[i+len(period_4):i+len(pattern_4)+len(period_4)]) == PR(pattern[i:i+len(pattern_4)] + pattern[i+len(pattern_4):i+len(pattern_4)+len(period_4)]) - PR(s_period_4)
    # assert PR(pattern[i+len(period_4):i+len(pattern_4)+len(period_4)]) == pattern[i-len(period_4):i+len(pattern_4)-len(period_4)]+pattern[i+len(pattern_4)-len(period_4):i+len(pattern_4)-len(period_4)] - PR(s_period_4)
 # Do the bits of a prime number correspond to the coefficients of an irreducible polynomial?
 # Counts, among the selected primes whose bit pattern is a polynomial of
 # degree exactly k, how many of those polynomials are irreducible over GF(2).
 k = 31
 reducible = 0
 irreducible = 0
 for p in Primes()[200000000:200010000]:#[100000:100000]:
 # for p in range(2147483648,2147483648+10000):
    # Bit i of p (least significant first) becomes the coefficient of x^i
    poly = PR(tuple(bin(p)[2:][::-1]))
    # print(f'{poly.degree()}')
    # Stop at the first degree above k
    if poly.degree() > k:
        break
    # Skip the primes that are too small
    if poly.degree() != k:
        continue
    irr = poly.is_irreducible()
    # print(f'The polynomial {poly}, corresponding to the prime {p}, being an irreducible polynomial is {irr}.')
    if irr:
        irreducible += 1
    else:
        reducible += 1
 # NOTE(review): divides by zero if no prime of degree k was encountered
 print(f'{irreducible}/{reducible+irreducible} of the primes correspond to irreducible polynomials. That is {float(irreducible/(reducible+irreducible))*100}%')
 # For every selected prime p whose bit pattern is an irreducible polynomial:
 # compare the integer remainder i % p, read as a polynomial, with the
 # polynomial remainder of i modulo p, for a random i in (p, 2p).
 progress = 0
 the_same = 0
 different = 0
 for p in Primes()[200000000:200010000]:
    progress += 1
    # \r rewrites the progress counter in place
    print(f'\r{progress}/10000', end='')
    p_poly = PR(tuple(bin(p)[2:][::-1]))
    if not p_poly.is_irreducible():
        continue
    # i = p + randint(1,2**29)
    i = p + randint(1,p-1)
    # print(f'{i}, {p}, {2*p}, {i%p}')
    i_poly = PR(tuple(bin(i)[2:][::-1]))
    i_mod_p = i % p
    i_mod_p_poly = PR(tuple(bin(i_mod_p)[2:][::-1]))
    # print(f'i_poly: {i_poly}')
    # print(f'p_poly: {p_poly}')
    # print(f'i_mod_p_poly: {i_mod_p_poly}')
    if i_mod_p_poly == i_poly % p_poly:
        the_same += 1
    else:
        different += 1
    # if not i_mod_p_poly == i_poly - (p_poly - PR(f'x^{p_poly.degree()}')):
    # if not i_mod_p_poly == i_poly % p_poly:
    #     print()
    #     print('ERROR')
    #     print(i_mod_p_poly)
    #     # print(i_poly - (p_poly - PR(f'x^{p_poly.degree()}')))
    #     print(i_poly % p_poly)
    #     break
    # assert i_mod_p_poly == i_poly - (p_poly - PR(f'x^{p_poly.degree()}'))
 print()
 # NOTE(review): divides by zero if none of the primes gave an irreducible polynomial
 print(f'{the_same}/{the_same+different} are the same as if we did polynomial calculations. This is {float(the_same/(the_same+different))*100}%')