# Load the Python libraries
import math
import random
import timeit
import numpy as np
from scipy import stats as sci
import statistics as stats
from itertools import cycle


# Load plotting libraries
import matplotlib.pyplot as plt


# Example values: the two operands passed to the GCD functions below
m = 12000000
n = 76000000


# Function that returns the GCD of two values (intuitive algorithm)
def gcd_simple(m, n):
    """Return the greatest common divisor of two integers by brute force.

    The search starts at the smaller magnitude and counts down until it
    reaches a value that divides both operands, so the running time grows
    linearly with min(|m|, |n|).

    Signs are ignored, gcd(0, k) is |k| and gcd(0, 0) is 0.
    """
    m, n = abs(m), abs(n)

    # gcd(0, k) == k by definition; returning early also avoids the
    # modulo-by-zero that the countdown below would otherwise hit.
    if m == 0 or n == 0:
        return max(m, n)

    i = min(m, n)

    # i == 1 always divides both values, so the loop is guaranteed to stop.
    while (m % i != 0) or (n % i != 0):
        i -= 1

    return i


# Time one call of gcd_simple (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(gcd_simple(m, n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

4000000
>> elapsed time 1080.9609 ms


# Function that returns the GCD of two values (euclidean algorithm)
def gcd_euclidean(m, n):
    """Return the greatest common divisor of two integers (Euclid's algorithm).

    The pair (m, n) is repeatedly replaced by (n mod m, m) until m reaches
    zero; the remaining n is the GCD. The operands may be given in any
    order: if m > n the first iteration simply swaps them.

    Signs are ignored, gcd(0, k) is |k| and gcd(0, 0) is 0.
    """
    m, n = abs(m), abs(n)

    # No explicit min/max ordering is needed (and the previous sequential
    # min-then-max assignment lost the larger operand when m > n).
    while m > 0:
        m, n = n % m, m

    return n


# Time one call of gcd_euclidean on the same operands (the print is inside
# the timed span) and report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(gcd_euclidean(m, n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

4000000
>> elapsed time 1.6196000000001654 ms


# Example value: index of the Fibonacci number computed by the functions below
n = 35


# Function that returns the n-fibonacci value (recursive algorithm)
def fibo_rec(n):
    """Return the n-th Fibonacci number using the naive double recursion.

    Values of n below 2 are returned unchanged (so F(0) = 0 and F(1) = 1);
    every other value is the sum of the two preceding Fibonacci numbers.
    """
    if n >= 2:
        return fibo_rec(n - 1) + fibo_rec(n - 2)

    # Base case: n itself is the answer.
    return n


# Time one call of fibo_rec (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(fibo_rec(n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

9227465
>> elapsed time 5066.8688 ms


# Function that returns the n-fibonacci value (iterative algorithm)
def fibo_iter(n):
    """Return the n-th Fibonacci number by iterating n times.

    Two consecutive values of the sequence are kept and advanced one step
    per iteration; for n <= 0 the loop does not run and 0 is returned.
    """
    previous, current = 1, 0

    for _ in range(n):
        # Slide the window: the old current becomes previous and the sum
        # of both becomes the new current.
        previous, current = current, previous + current

    return current


# Time one call of fibo_iter (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(fibo_iter(n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

9227465
>> elapsed time 0.9330999999992429 ms


# Function that returns the n-fibonacci value (De Moivre equation)
def fibo_de_moivre(n):
    """Return the n-th Fibonacci number from the closed-form expression.

    Evaluates (phi**n - (-phi)**(-n)) / sqrt(5), where phi is the golden
    ratio, in floating point and converts the result to an integer.

    The floating-point value can land a hair below the exact integer, so it
    is rounded to the nearest integer instead of truncated. The result is
    only as exact as double precision allows, which limits the usable range
    of n (large n lose precision, and very large n overflow a float).
    """
    sqrt_5 = 5 ** (1 / 2)
    golden_ratio = (1 + sqrt_5) / 2
    f = (golden_ratio**n - (-golden_ratio)**(-n)) / sqrt_5

    # round(), not int(): truncation would turn e.g. 54.99999999 into 54.
    return round(f)


# Time one call of fibo_de_moivre (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(fibo_de_moivre(n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

9227465
>> elapsed time 0.2905000000001934 ms


# Example values: n is the product of a and b and is the input of the
# factorization functions below
a, b = 104723, 104729
n = a * b
n  # bare expression; presumably displays the value when run as a notebook cell

10967535067


# Function that returns the factorization of an integer (ascending approach)
def fact_int(n):
    """Split n into two factors by trial division in ascending order.

    Candidates m = 2, 3, ... are tried while m * m <= n. The first divisor
    found yields the pair (m, n // m), where m is the smallest factor of n
    greater than 1. If no candidate divides n, (1, n) is returned.

    The bound is checked with exact integer arithmetic and includes the
    square root itself, so perfect squares such as 49 are factored as
    (7, 7) instead of being reported as (1, 49).
    """
    m = 2

    while m * m <= n:
        if n % m == 0:
            return (m, n // m)
        m += 1

    return (1, n)


# Time one call of fact_int (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(fact_int(n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

(104723, 104729)
>> elapsed time 82.78020000000019 ms


# Function that returns the factorization of an integer (descending approach)
def _floor_sqrt(n):
    """Return the largest integer r with r * r <= n, for an integer n >= 0."""
    if n < 2:
        return n

    # Integer Newton iteration, started from a power of two that is
    # guaranteed to be >= sqrt(n); the sequence decreases until it settles.
    r = 1 << ((n.bit_length() + 1) // 2)
    while True:
        nxt = (r + n // r) // 2
        if nxt >= r:
            return r
        r = nxt


def fact_int_2(n):
    """Split n into two factors by trial division in descending order.

    Candidates start at floor(sqrt(n)) and count down to 2. The first
    divisor found yields the pair (m, n // m), which is the factor pair
    whose members are closest to each other. If no candidate divides n
    (or n < 2), (1, n) is returned.

    The starting point is computed with exact integer arithmetic: a
    floating-point square root can land below the true root for very large
    n, which would make the search skip the closest factor pair.
    """
    if n < 2:
        return (1, n)

    m = _floor_sqrt(int(n))

    while m > 1:
        if n % m == 0:
            return (m, n // m)
        m -= 1

    return (1, n)


# Time one call of fact_int_2 (the print is inside the timed span) and
# report the elapsed time in milliseconds
start_time = timeit.default_timer()
print(fact_int_2(n))
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

(104723, 104729)
>> elapsed time 0.9137999999992985 ms


# Number of disks, between 2 and 64. Large values are not recommended:
# the solvers below print one line per move and there are 2**n_disks - 1 moves
n_disks = 5


# Move n disks from the source tower to the target tower (recursive version)
def hanoi_rec(n, source, aux, target):
    """Print the moves that transfer n disks from `source` to `target`.

    `aux` is the spare tower. Nothing is printed (and nothing happens)
    when n is not positive.
    """
    if n <= 0:
        return

    # Park the n - 1 smaller disks on the spare tower ...
    hanoi_rec(n - 1, source, target, aux)
    # ... move the largest of the n disks straight to its destination ...
    print('Move disk', n, 'from:', source, 'to:', target)
    # ... and bring the smaller disks back on top of it.
    hanoi_rec(n - 1, aux, source, target)


# Print the expected number of moves, run the recursive solver and report
# the elapsed time in milliseconds (all printing is inside the timed span)
start_time = timeit.default_timer()
print('>> number of movements:', (2**n_disks - 1))
hanoi_rec(n_disks, 'T1', 'T2', 'T3')
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

>> number of movements: 31
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 3 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 4 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 2 from: T3 to: T1
Move disk 1 from: T2 to: T1
Move disk 3 from: T3 to: T2
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 5 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 3 from: T2 to: T1
Move disk 1 from: T3 to: T2
Move disk 2 from: T3 to: T1
Move disk 1 from: T2 to: T1
Move disk 4 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 3 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
>> elapsed time 17.174699999999987 ms


# Move n disks from the source tower to the target tower (iterative version)
def hanoi_iter(n, source, aux, target):
    """Print the moves that transfer n disks from `source` to `target`.

    Iterative solution: odd-numbered moves always move the smallest disk
    one step along a fixed cycle of towers (the direction depends on the
    parity of n); even-numbered moves perform the only legal move between
    the two towers that do not hold the smallest disk.

    The number of moves (2**n - 1) is printed first, followed by one line
    per move. The disk count is taken from the parameter `n`, not from any
    module-level variable.
    """
    n_movements = 2**n - 1
    print('>> number of movements:', n_movements)

    labels = [source, aux, target]
    # Each tower is a stack whose last element is its top disk; the source
    # tower starts with disks n..1, largest at the bottom.
    towers = [list(range(n, 0, -1)), [], []]
    indexes = cycle([0, 1, 2] if n % 2 == 0 else [0, 2, 1])
    smallest_at = next(indexes)  # index of the tower holding disk 1

    for move in range(1, n_movements + 1):
        if move % 2 == 1:
            # Odd move: advance the smallest disk to the next tower in the cycle.
            s, t = smallest_at, next(indexes)
            smallest_at = t
        else:
            # Even move: between the two other towers, the smaller top disk
            # moves onto the larger one; an empty tower counts as infinity.
            i_a, i_b = [k for k in range(3) if k != smallest_at]
            top_a = towers[i_a][-1] if towers[i_a] else math.inf
            top_b = towers[i_b][-1] if towers[i_b] else math.inf
            s, t = (i_a, i_b) if top_a < top_b else (i_b, i_a)

        disk = towers[s].pop()
        towers[t].append(disk)
        print('Move disk', disk, 'from:', labels[s], 'to:', labels[t])


# Run the iterative solver and report the elapsed time in milliseconds
# (all printing is inside the timed span)
start_time = timeit.default_timer()
hanoi_iter(n_disks, 'T1', 'T2', 'T3')
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

>> number of movements: 31
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 3 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 4 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 2 from: T3 to: T1
Move disk 1 from: T2 to: T1
Move disk 3 from: T3 to: T2
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 5 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 3 from: T2 to: T1
Move disk 1 from: T3 to: T2
Move disk 2 from: T3 to: T1
Move disk 1 from: T2 to: T1
Move disk 4 from: T2 to: T3
Move disk 1 from: T1 to: T3
Move disk 2 from: T1 to: T2
Move disk 1 from: T3 to: T2
Move disk 3 from: T1 to: T3
Move disk 1 from: T2 to: T1
Move disk 2 from: T2 to: T3
Move disk 1 from: T1 to: T3
>> elapsed time 15.435800000000555 ms


# Bubble-sort: non-efficient sorting algorithm
def bubble_sort(array):
    """Sort `array` in place in ascending order and return the same object.

    Classic bubble sort: every pass compares neighbouring elements and
    swaps those that are out of order, so the largest remaining value ends
    up at the end of the unsorted prefix.
    """
    # `last` is the final index of the still-unsorted prefix; it shrinks by
    # one after each pass.
    for last in range(len(array) - 1, -1, -1):
        for left in range(last):
            right = left + 1
            if array[left] > array[right]:
                held = array[left]
                array[left] = array[right]
                array[right] = held

    return array


# Example values: n pseudo-random integers, each in the range [0, n)
n = 100
raw_data = [int(random.random() * n) for _ in range(n)]


# Sorting data: bubble_sort works in place, so a copy is sorted and
# raw_data keeps its original order
sorted_data = bubble_sort(raw_data.copy())


# Plotting: one figure with two side-by-side panels (raw vs. sorted data)
fig = plt.figure(figsize = (16, 8))
fig.subplots_adjust(hspace = 0.15, wspace = 0.15)

# Left panel: values in their original order, drawn as markers only (linewidth=0)
plt.subplot(1, 2, 1)
plt.plot(raw_data, linewidth=0, marker="o", markersize=3, color="#3366cc")
plt.title("Data Before Sorting", fontsize = 14)
plt.ylabel('Value')
plt.xlabel('Index')

# Right panel: the sorted copy of the same values, drawn the same way
plt.subplot(1, 2, 2)
plt.plot(sorted_data, linewidth=0, marker="o", markersize=3, color="#109618")
plt.title("Data After Sorting", fontsize = 14)
plt.ylabel('Value')
plt.xlabel('Index')
plt.show()


# Validation values: differences between each element and its predecessor.
# Index 0 has no predecessor, so its difference is fixed at 0.
x_data = [0] + list(range(1, n))
diff_raw_data = [0] + [raw_data[k] - raw_data[k - 1] for k in range(1, n)]
diff_sorted_data = [0] + [sorted_data[k] - sorted_data[k - 1] for k in range(1, n)]


# Showing gap differences: sum of the absolute jumps between neighbouring points
raw_sum_abs = sum(map(abs, diff_raw_data))
sorted_sum_abs = sum(map(abs, diff_sorted_data))

print('Raw data - Gap sum:', raw_sum_abs)
print('Sorted data - Gap sum:', sorted_sum_abs)

Raw data - Gap sum: 3085
Sorted data - Gap sum: 95


# Plotting: one figure with two side-by-side panels showing the
# element-to-element differences computed above
fig = plt.figure(figsize = (16, 8))
fig.subplots_adjust(hspace = 0.15, wspace = 0.15)

# Left panel: differences of the raw data, as a step line plus markers
plt.subplot(1, 2, 1)
plt.step(x_data, diff_raw_data, where='mid', color="#3366cc", alpha=0.6)
plt.plot(diff_raw_data, linewidth=0, marker="o", markersize=3, color="#3366cc")
plt.title("Differences between Raw points", fontsize = 14)
plt.ylabel('Diff')
plt.xlabel('Index')

# Right panel: differences of the sorted data, drawn the same way
plt.subplot(1, 2, 2)
plt.step(x_data, diff_sorted_data, where='mid', color="#109618", alpha=0.6)
plt.plot(diff_sorted_data, linewidth=0, marker="o", markersize=3, color="#109618")
plt.title("Differences between Sorted points", fontsize = 14)
plt.ylabel('Diff')
plt.xlabel('Index')
plt.show()


# Calculate the sample standard deviation (not the variance) of the
# differences between consecutive raw values
stats.stdev(diff_raw_data)

39.243877473969356


# Calculate the sample standard deviation (not the variance) of the
# differences between consecutive sorted values
stats.stdev(diff_sorted_data)

1.0952145677879515


# Example values: n random points whose integer coordinates lie in [0, n),
# stored as an (n, 2) array
n = 1000
points = np.array([
    (int(random.random() * n), int(random.random() * n))
    for _ in range(n)
])


# Returns the convex hull, assuming that each points[i] <= points[i + 1]. Runs in O(n) time
def make_hull_presorted(points):
    """Return the convex hull vertices of an already sorted point sequence.

    `points` must be ordered so that each points[i] <= points[i + 1]
    (by x, then by y); every point is an (x, y) pair. Two chains are
    built, one scanning the points left to right and one right to left,
    and concatenated. Each point is appended once and removed at most once
    per chain, so the running time is linear in len(points).

    Points may be tuples, lists or NumPy rows. Collinear points on the
    boundary are not reported as vertices. The hull is returned as a list
    and is not closed (the first vertex is not repeated at the end).
    """
    if len(points) <= 1:
        return list(points)

    # Andrew's monotone chain algorithm
    upperhull = []
    lowerhull = []
    for hull in (upperhull, lowerhull):
        for p in (points if (hull is upperhull) else reversed(points)):
            # Drop the last vertex while it does not make the required
            # turn with the new point p (cross-product sign test).
            while len(hull) >= 2:
                qx, qy = hull[-1]
                rx, ry = hull[-2]
                if (qx - rx) * (p[1] - ry) >= (qy - ry) * (p[0] - rx):
                    del hull[-1]
                else:
                    break
            hull.append(p)
        # The last point of each chain is the first point of the other one.
        del hull[-1]

    # When all points coincide both chains hold that single point; keep one.
    # Coordinates are compared as tuples because comparing NumPy rows with
    # == yields an array whose truth value is ambiguous.
    single_point = (
        len(upperhull) == 1
        and len(lowerhull) == 1
        and tuple(upperhull[0]) == tuple(lowerhull[0])
    )
    if not single_point:
        upperhull.extend(lowerhull)

    return upperhull

# This algorithm runs in O(n log n) time
def convex_hull_greedy(points):
    """Return the convex hull of `points` as a closed list of vertices.

    The points are sorted and handed to make_hull_presorted; the first hull
    vertex is then appended again so that consecutive entries describe
    every edge of the polygon. Sorting dominates the running time.

    The sort is lexicographic (by x, then by y). Sorting by x alone leaves
    points that share an x coordinate in arbitrary order, which breaks the
    ordering assumed by make_hull_presorted and can drop true hull
    vertices. An empty input yields an empty list.
    """
    sorted_points = sorted(points, key=lambda p: (p[0], p[1]))
    hull = make_hull_presorted(sorted_points)

    # Close the polygon only when there is at least one vertex to repeat.
    if hull:
        hull.append(hull[0])
    return hull


# Run algorithm on the random points and report the elapsed time in milliseconds
start_time = timeit.default_timer()
hull = convex_hull_greedy(points)
print('>> elapsed time', (timeit.default_timer() - start_time) * 1000, 'ms')

>> elapsed time 42.057800000000256 ms


# Plotting convex hull results: all points as black markers, then one blue
# segment per pair of consecutive hull vertices
plt.figure(figsize = (8, 8))
plt.plot(points[:,0], points[:,1], linewidth=0, marker="o", markersize=2, color="black")
for i in range(1, len(hull)):
    p1 = hull[i-1]
    p2 = hull[i]
    plt.plot([p1[0], p2[0]], [p1[1], p2[1]], color="#3366cc")

plt.title("Convex Hull - Iterative", fontsize = 14)
plt.ylabel('y')
plt.xlabel('x')
plt.show()


# Initialize variables: a flat distribution of n entries, each equal to 25,
# and the sum of all entries
n = 256
data_raw = [25] * n
total = sum(data_raw)
print('Total values:', total)

Total values: 6400


# Creating target distribution: a normal curve with mean n/2 and standard
# deviation alpha*n, sampled at n evenly spaced positions between 0 and n
# and scaled by total
alpha = 0.02
t_func = sci.norm(n/2, alpha*n)
x = np.linspace(0, n, n)
y = t_func.pdf(x) * total


# Create pretty x axis labels
def get_x_labels(n):
    """Return n tick labels in which only every tenth position is labelled.

    Positions 0, 10, 20, ... carry their index as a string; every other
    position gets an empty string.
    """
    return [str(ix) if ix % 10 == 0 else '' for ix in range(n)]


# Function that plots a symbol distribution
def plot_symbol_dist(data, x, y):
    """Show `data` as a bar chart with the curve (x, y) drawn in the same figure.

    One bar is drawn per entry of `data` at positions 0..len(data) - 1, and
    the x-axis tick labels come from get_x_labels. The figure is displayed
    immediately; nothing is returned.
    """
    # Bar positions and their tick labels
    count = len(data)
    positions = np.arange(count)
    tick_labels = get_x_labels(count)

    # Curve first, then the semi-transparent bars
    plt.figure(figsize=(12, 5))
    plt.plot(x, y, '-', color='#ff7f0e', lw=3, label='Real distribution')
    plt.bar(positions, data, align='center', alpha=0.5)
    plt.xticks(positions, tick_labels, fontsize=10, rotation=50)
    plt.ylabel('Value')
    plt.title('Distribution')
    plt.show()


# Plot current (flat) distribution together with the target curve
plot_symbol_dist(data_raw, x, y)


# Function that calculates the new distribution
def get_new_dist(data_raw, y):
    """Reshape `data_raw` so that each entry is capped by the target curve `y`.

    The first half is processed from the left end towards the middle and
    the second half from the right end towards the middle. At every
    position the entry plus the running carry is capped at floor(y[i])
    (but never below 1); whatever exceeds the cap is carried to the next
    position. The carry left after the forward pass is the starting carry
    of the backward pass, and both carries are printed.

    Returns a new list with the same length as `data_raw`.
    """
    size = len(data_raw)
    half = size // 2

    def settle(idx, carried):
        # Amount available here, the cap imposed by the target, and the split
        # into what stays at this position and what moves on.
        available = data_raw[idx] + carried
        cap = max(math.floor(y[idx]), 1)
        kept = min(available, cap)
        return kept, available - kept

    carry = 0
    left_part = []
    for idx in range(half):
        kept, carry = settle(idx, carry)
        left_part.append(kept)
    print('Forward carry:', carry)

    right_part = []
    for idx in reversed(range(half, size)):
        kept, carry = settle(idx, carry)
        right_part.append(kept)
    print('backward carry:', carry)

    # The right part was collected from the outside in; restore index order.
    right_part.reverse()
    return left_part + right_part


# Redistribute data_raw under the target curve y and print the length of the result
data_new = get_new_dist(data_raw, y)
print('n temp:', len(data_new))

Forward carry: 0
backward carry: 0
n temp: 256


# Plot the redistributed data together with the same target curve
plot_symbol_dist(data_new, x, y)


# Difference between distributions: original total minus the sum of the new
# data (0 means the two totals match)
print('>> diff:', total - sum(data_new))

>> diff: 0

1. Algorithm's Basics¶

Algorithms¶

1.1. Greatest Common Divisor (GCD)¶

1.1.1. Simple approach¶

1.1.2. Enhanced approach¶

1.2. Fibonacci Series¶

1.2.1. Recursive algorithm¶

1.2.2. Iterative algorithm¶

1.2.3. Approximation approach¶

1.3. Integer Factorization¶

1.4. Tower of Hanoi¶

1.4.1. The recursive and classic algorithm¶

1.4.2. Iterative algorithm¶

1.5. Sorting Algorithm¶

1.6. Convex Hull¶

1.7. Changing Distribution¶

Creating a toy uniform distribution¶

Calculate and plot new (Normal) distribution¶

References¶