| // |
| // Copyright 2020 Google LLC |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| // |
| |
| package com.google.privacy.differentialprivacy.example; |
| |
| import com.google.privacy.differentialprivacy.BoundedSum; |
| import java.time.DayOfWeek; |
| import java.util.EnumMap; |
| import java.util.HashMap; |
| import java.util.Map; |
| |
| /** |
| * Similar to {@link SumRevenuePerDay} but a visitor may enter the restaurant multiple times a day. |
| */ |
| public class SumRevenuePerDayWithPreAggregation { |
| private static final String NON_PRIVATE_OUTPUT = "non_private_sums_per_day_w_preaggregation.csv"; |
| private static final String PRIVATE_OUTPUT = "private_sums_per_day_w_preaggregatio.csv"; |
| |
| private static final double LN_3 = Math.log(3); |
| |
| /** |
| * Number of visit days contributed by a single visitor will be limited to 4. All exceeding |
| * visits will be discarded. |
| */ |
| private static final int MAX_CONTRIBUTED_DAYS = 4; |
| /** Minimum amount of money we expect a visitor to spend on a single visit. */ |
| private static final int MIN_EUROS_SPENT = 0; |
| /** Maximum amount of money we expect a visitor to spend on a single visit. */ |
| private static final int MAX_EUROS_SPENT = 65; |
| |
| private SumRevenuePerDayWithPreAggregation() { } |
| |
| /** |
| * Similar to {@link SumRevenuePerDay#run} but pre-aggregates visitor spending per day when |
| * calculating private revenue. |
| */ |
| public static void run() { |
| VisitsForWeek visitsForWeek = IOUtils.readWeeklyVisits(InputFilePath.WEEK_STATISTICS); |
| |
| EnumMap<DayOfWeek, Integer> nonPrivateSums = getNonPrivateSums(visitsForWeek); |
| EnumMap<DayOfWeek, Integer> privateSums = getPrivateSums(visitsForWeek); |
| |
| IOUtils.writeCountsPerDayOfWeek(nonPrivateSums, NON_PRIVATE_OUTPUT); |
| IOUtils.writeCountsPerDayOfWeek(privateSums, PRIVATE_OUTPUT); |
| } |
| |
| /** Returns total raw revenue for each day of the week. */ |
| private static EnumMap<DayOfWeek, Integer> getNonPrivateSums(VisitsForWeek visits) { |
| return SumRevenuePerDay.getNonPrivateSums(visits); |
| } |
| |
| /** Returns total anonymized revenue for each day of the week. */ |
| private static EnumMap<DayOfWeek, Integer> getPrivateSums(VisitsForWeek visits) { |
| EnumMap<DayOfWeek, Integer> privateSumsPerDay = new EnumMap<>(DayOfWeek.class); |
| |
| // Pre-process the data set: limit the number of visits to MAX_CONTRIBUTED_DAYS |
| // per visitorId. |
| VisitsForWeek boundedVisits = |
| ContributionBoundingUtils.boundContributedDays(visits, MAX_CONTRIBUTED_DAYS); |
| |
| for (DayOfWeek d : DayOfWeek.values()) { |
| BoundedSum dpSum = |
| BoundedSum.builder() |
| .epsilon(LN_3) |
| // The data was pre-processed so that each visitor may visit the restaurant up to |
| // MAX_CONTRIBUTED_DAYS days per week. |
| // Hence, each user may contribute to up to MAX_CONTRIBUTED_DAYS daily counts. |
| // Note: while the library accepts this limit as a configurable parameter, |
| // it doesn't pre-process the data to ensure this limit is respected. |
| // It is responsibility of the caller to ensure the data passed to the library |
| // is capped for getting the correct privacy guarantee. |
| .maxPartitionsContributed(MAX_CONTRIBUTED_DAYS) |
| // No need to pre-process the data: BoundedSum will clamp the input values. |
| .lower(MIN_EUROS_SPENT) |
| .upper(MAX_EUROS_SPENT) |
| .build(); |
| |
| // For each visitor, pre-aggregate their spending for the day. |
| Map<String, Integer> visitorToDaySpending = new HashMap<>(); |
| for (Visit v : boundedVisits.getVisitsForDay(d)) { |
| String visitorId = v.visitorId(); |
| if (visitorToDaySpending.containsKey(visitorId)) { |
| int newAmount = visitorToDaySpending.get(visitorId) + v.eurosSpent(); |
| visitorToDaySpending.put(visitorId, newAmount); |
| } else { |
| visitorToDaySpending.put(visitorId, v.eurosSpent()); |
| } |
| } |
| |
| for (Integer visitorSpending : visitorToDaySpending.values()) { |
| dpSum.addEntry(visitorSpending); |
| } |
| |
| privateSumsPerDay.put(d, (int) dpSum.computeResult()); |
| } |
| |
| return privateSumsPerDay; |
| } |
| } |