From 51943bbef3c7fd6aa25ad858452b045939ac3487 Mon Sep 17 00:00:00 2001 From: Manos Katsomallos Date: Mon, 26 Jul 2021 17:22:02 +0300 Subject: [PATCH] lmdk_bgt.incremental: Initial commit --- code/lib/lmdk_bgt.py | 61 ++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 61 insertions(+) diff --git a/code/lib/lmdk_bgt.py b/code/lib/lmdk_bgt.py index a12bb37..b8e0b9f 100644 --- a/code/lib/lmdk_bgt.py +++ b/code/lib/lmdk_bgt.py @@ -467,6 +467,67 @@ def discount(seq, lmdks, epsilon): return rls_data, bgts, skipped +def incremental(seq, lmdks, epsilon, diff_rt): + ''' + Incremental sampling. + + Parameters: + seq - The point sequence. + lmdks - The landmarks. + epsilon - The available privacy budget. + diff_rt - Sampling rate difference. + Returns: + rls_data - The perturbed data. + bgts - The privacy budget allocation. + skipped - The number of skipped releases. + ''' + # Uniform budget allocation + bgts = uniform(seq, lmdks, epsilon) + # Released + rls_data = [None]*len(seq) + # The sampling rate + # (publish with 50% chance) + samp_rt = .5 + # Track landmarks + lmdk_cur = 0 + # Track consecutive landmarks + lmdk_con = 0 + # Track skipped releases + skipped = 0 + for i, p in enumerate(seq): + # Check if current point is a landmark + if lmdk_lib.is_landmark(p, lmdks): + lmdk_cur += 1 + # Increase sampling rate + samp_rt += (1 - samp_rt)*diff_rt + else: + # Decrease sampling rate + samp_rt -= samp_rt*diff_rt + # Get coordinates + loc = (p[1], p[2]) + if i == 0 or lmdk_lib.should_sample(samp_rt): + # Add noise to original data + new_loc = lmdk_lib.add_polar_noise(loc, bgts[i]) + rls_data[i] = [p[0], new_loc[0], new_loc[1], p[3]] + # Adjust sampling rate + if lmdk_lib.is_landmark(p, lmdks): + # Adjust consecutive landmarks tracking + lmdk_con += 1 + else: + skipped += 1 + # Skip current release and approximate with previous + rls_data[i] = rls_data[i - 1] + if lmdk_lib.is_landmark(p, lmdks): + # Reset consecutive landmarks tracking + lmdk_con = 0 + # Allocate the current budget to the following releases uniformly + for j in range(i + 1, len(seq)): + bgts[j] += bgts[i]/(len(lmdks) - lmdk_cur + 1) + # No budget was spent + bgts[i] = 0 + return rls_data, bgts, skipped + + def uniform_r(seq, lmdks, epsilon): # Released rls_data = [None]*len(seq)