/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package gobblin.data.management.retention.policy;
import java.util.Collection;
import java.util.List;
import java.util.Properties;
import lombok.extern.slf4j.Slf4j;
import org.joda.time.DateTime;
import org.joda.time.Duration;
import org.joda.time.format.ISOPeriodFormat;
import com.google.common.base.Optional;
import com.google.common.base.Preconditions;
import com.google.common.base.Predicate;
import com.google.common.collect.Collections2;
import com.google.common.collect.Lists;
import com.typesafe.config.Config;
import gobblin.data.management.retention.DatasetCleaner;
import gobblin.data.management.version.DatasetVersion;
import gobblin.data.management.version.TimestampedDatasetVersion;
import gobblin.util.ConfigUtils;
/**
* Retain dataset versions newer than now - {@link #retention}.
*/
@Slf4j
public class TimeBasedRetentionPolicy implements RetentionPolicy<TimestampedDatasetVersion> {
public static final String RETENTION_MINUTES_KEY = DatasetCleaner.CONFIGURATION_KEY_PREFIX + "minutes.retained";
// ISO8601 Standard PyYmMwWdDThHmMsS
public static final String RETENTION_TIMEBASED_DURATION_KEY =
DatasetCleaner.CONFIGURATION_KEY_PREFIX + "timebased.duration";
private final Duration retention;
public TimeBasedRetentionPolicy(Properties props) {
this(ConfigUtils.propertiesToConfig(props));
}
/**
* Creates a new {@link TimeBasedRetentionPolicy} using {@link #RETENTION_TIMEBASED_DURATION_KEY} in the
* <code>config</code>
* <ul> Some Example values for {@link #RETENTION_TIMEBASED_DURATION_KEY} are
* <li> P20D = 20 Days
* <li> P20H = 20 Hours
* <li> P2Y = 2 Years
* <li> P2Y3M = 2 Years and 3 Months
* <li> PT23M = 23 Minutes (Note this is different from P23M which is 23 Months)
* </ul>
*
* @param config that holds retention duration in ISO8061 format at key {@link #RETENTION_TIMEBASED_DURATION_KEY}.
*/
public TimeBasedRetentionPolicy(Config config) {
this.retention = getDuration(config);
log.info(String.format("%s will delete dataset versions older than %s.", TimeBasedRetentionPolicy.class.getName(),
this.retention.toString()));
}
public TimeBasedRetentionPolicy(String duration) {
this.retention = parseDuration(duration);
log.info(String
.format("%s will delete dataset versions older than %s.", TimeBasedRetentionPolicy.class.getName(), duration));
}
@Override
public Class<? extends DatasetVersion> versionClass() {
return TimestampedDatasetVersion.class;
}
@Override
public Collection<TimestampedDatasetVersion> listDeletableVersions(List<TimestampedDatasetVersion> allVersions) {
return Lists.newArrayList(Collections2.filter(allVersions, new Predicate<DatasetVersion>() {
@Override
public boolean apply(DatasetVersion version) {
return ((TimestampedDatasetVersion) version).getDateTime().plus(TimeBasedRetentionPolicy.this.retention)
.isBeforeNow();
}
}));
}
/**
* Since months and years can have arbitrary days, joda time does not allow conversion of a period string containing
* months or years to a duration. Hence we calculate the duration using 1970 01:01:00:00:00 UTC as a reference time.
*
* <p>
* <code>
* (1970 01:01:00:00:00 + P2Y) - 1970 01:01:00:00:00 = Duration for 2 years
* </code>
* </p>
*
* @param periodString
* @return duration for this period.
*/
private static Duration parseDuration(String periodString) {
DateTime zeroEpoc = new DateTime(0);
return new Duration(zeroEpoc, zeroEpoc.plus(ISOPeriodFormat.standard().parsePeriod(periodString)));
}
private static Duration getDuration(Config config) {
Preconditions
.checkArgument(config.hasPath(RETENTION_TIMEBASED_DURATION_KEY) || config.hasPath(RETENTION_MINUTES_KEY),
String.format("Either %s or %s needs to be set", RETENTION_TIMEBASED_DURATION_KEY, RETENTION_MINUTES_KEY));
if (config.hasPath(RETENTION_TIMEBASED_DURATION_KEY)) {
return parseDuration(config.getString(RETENTION_TIMEBASED_DURATION_KEY));
} else {
return Duration.standardMinutes(Long.parseLong(config.getString(RETENTION_MINUTES_KEY)));
}
}
}