the-last-thing/code/expt/lmdk_sel_cmp.py

130 lines
3.5 KiB
Python
Raw Normal View History

2021-10-06 00:43:39 +02:00
#!/usr/bin/env python3
import sys
sys.path.insert(1, '../lib')
import argparse
import lmdk_lib
import lmdk_sel
import exp_mech
import numpy as np
import os
from matplotlib import pyplot as plt
import time
def main(args):
# Privacy goal
epsilon = 1.0
# Number of timestamps
seq = lmdk_lib.get_seq(1, args.time)
# Distribution type
dist_type = np.array(range(0, 4))
# Number of landmarks
2021-10-11 04:01:08 +02:00
lmdk_n = np.array(range(0, args.time + 1, int(args.time/5)))
markers = [
'^', # Symmetric
'v', # Skewed
'D', # Bimodal
's' # Uniform
]
2021-10-06 00:43:39 +02:00
# Initialize plot
lmdk_lib.plot_init()
# Width of bars
bar_width = 1/(len(dist_type) + 1)
# The x axis
x_i = np.arange(len(lmdk_n))
x_margin = bar_width*(len(dist_type)/2 + 1)
plt.xticks(x_i, ((lmdk_n/len(seq))*100).astype(int))
plt.xlabel('Landmarks (%)') # Set x axis label.
2021-10-11 04:01:08 +02:00
# plt.xlim(x_i.min() - x_margin, x_i.max() + x_margin)
plt.xlim(x_i.min(), x_i.max())
2021-10-06 00:43:39 +02:00
# The y axis
# plt.yscale('log')
2021-10-11 04:01:08 +02:00
plt.ylim(0, 1)
plt.ylabel('Normalized Euclidean distance') # Set y axis label.
# plt.ylabel('Normalized Wasserstein distance') # Set y axis label.
2021-10-06 00:43:39 +02:00
# Bar offset
x_offset = -(bar_width/2)*(len(dist_type) - 1)
for d_i, d in enumerate(dist_type):
# Set label
label = lmdk_lib.dist_type_to_str(d)
if d_i == 1:
label = 'Skewed'
# Logging
title = label + ' landmark distribution'
print('(%d/%d) %s... ' %(d_i + 1, len(dist_type), title), end='', flush=True)
mae = np.zeros(len(lmdk_n))
for n_i, n in enumerate(lmdk_n):
# Skip the last one
if n_i == len(lmdk_n) - 1:
break
2021-10-11 04:01:08 +02:00
for r in range(args.iter):
2021-10-06 00:43:39 +02:00
lmdks = lmdk_lib.get_lmdks(seq, n, d)
hist, h = lmdk_lib.get_hist(seq, lmdks)
opts = lmdk_sel.get_opts_from_top_h(seq, lmdks)
delta = 1.0
res, _ = exp_mech.exponential(hist, opts, exp_mech.score, delta, epsilon)
2021-10-11 04:01:08 +02:00
mae[n_i] += lmdk_lib.get_norm(hist, res)/args.iter # Euclidean
# mae[n_i] += lmdk_lib.get_emd(hist, res)/args.iter # Wasserstein
2021-10-13 09:03:36 +02:00
# Rescaling (min-max normalization)
# https://en.wikipedia.org/wiki/Feature_scaling#Rescaling_(min-max_normalization)
mae = (mae - mae.min())/(mae.max() - mae.min())
2021-10-06 00:43:39 +02:00
print('[OK]', flush=True)
2021-10-13 09:03:36 +02:00
# Plot bar for current distribution
2021-10-11 04:01:08 +02:00
plt.plot(
x_i,
2021-10-06 00:43:39 +02:00
mae,
label=label,
2021-10-11 04:01:08 +02:00
marker=markers[d_i],
markersize=lmdk_lib.marker_size,
markeredgewidth=0,
2021-10-06 00:43:39 +02:00
linewidth=lmdk_lib.line_width
)
2021-10-11 04:01:08 +02:00
path = str('../../rslt/lmdk_sel_cmp/' + 'lmdk_sel_cmp-norm-l')
# path = str('../../rslt/lmdk_sel_cmp/' + 'lmdk_sel_cmp-emd-l')
2021-10-06 00:43:39 +02:00
# Plot legend
lmdk_lib.plot_legend()
# Show plot
# plt.show()
# Save plot
lmdk_lib.save_plot(path + '.pdf')
'''
Parse arguments.
Optional:
2021-10-11 04:01:08 +02:00
iter - The number of iterations.
2021-10-06 00:43:39 +02:00
time - The time limit of the sequence.
'''
def parse_args():
# Create argument parser.
parser = argparse.ArgumentParser()
# Mandatory arguments.
# Optional arguments.
2021-10-11 04:01:08 +02:00
parser.add_argument('-i', '--iter', help='The number of iterations.', type=int, default=1)
2021-10-06 00:43:39 +02:00
parser.add_argument('-t', '--time', help='The time limit of the sequence.', type=int, default=100)
# Parse arguments.
args = parser.parse_args()
return args
if __name__ == '__main__':
try:
start_time = time.time()
main(parse_args())
end_time = time.time()
print('##############################')
print('Time elapsed: %s' % (time.strftime('%H:%M:%S', time.gmtime(end_time - start_time))))
print('##############################')
except KeyboardInterrupt:
print('Interrupted by user.')
exit()