package org.apache.lucene.document; /** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import java.text.ParseException; import java.text.SimpleDateFormat; import java.util.Calendar; import java.util.Date; import java.util.TimeZone; import java.util.Locale; import org.apache.lucene.search.NumericRangeQuery; // for javadocs import org.apache.lucene.util.NumericUtils; // for javadocs /** * Provides support for converting dates to strings and vice-versa. * The strings are structured so that lexicographic sorting orders * them by date, which makes them suitable for use as field values * and search terms. * * <P>This class also helps you to limit the resolution of your dates. Do not * save dates with a finer resolution than you really need, as then * RangeQuery and PrefixQuery will require more memory and become slower. * * <P> * Another approach is {@link NumericUtils}, which provides * a sortable binary representation (prefix encoded) of numeric values, which * date/time are. * For indexing a {@link Date} or {@link Calendar}, just get the unix timestamp as * <code>long</code> using {@link Date#getTime} or {@link Calendar#getTimeInMillis} and * index this as a numeric value with {@link NumericField} * and use {@link NumericRangeQuery} to query it. */ public class DateTools { private static final class DateFormats { final static TimeZone GMT = TimeZone.getTimeZone("GMT"); final SimpleDateFormat YEAR_FORMAT = new SimpleDateFormat("yyyy", Locale.US); final SimpleDateFormat MONTH_FORMAT = new SimpleDateFormat("yyyyMM", Locale.US); final SimpleDateFormat DAY_FORMAT = new SimpleDateFormat("yyyyMMdd", Locale.US); final SimpleDateFormat HOUR_FORMAT = new SimpleDateFormat("yyyyMMddHH", Locale.US); final SimpleDateFormat MINUTE_FORMAT = new SimpleDateFormat("yyyyMMddHHmm", Locale.US); final SimpleDateFormat SECOND_FORMAT = new SimpleDateFormat("yyyyMMddHHmmss", Locale.US); final SimpleDateFormat MILLISECOND_FORMAT = new SimpleDateFormat("yyyyMMddHHmmssSSS", Locale.US); { // times need to be normalized so the value doesn't depend on the // location the index is created/used: YEAR_FORMAT.setTimeZone(GMT); MONTH_FORMAT.setTimeZone(GMT); DAY_FORMAT.setTimeZone(GMT); HOUR_FORMAT.setTimeZone(GMT); MINUTE_FORMAT.setTimeZone(GMT); SECOND_FORMAT.setTimeZone(GMT); MILLISECOND_FORMAT.setTimeZone(GMT); } final Calendar calInstance = Calendar.getInstance(GMT, Locale.US); } private static final ThreadLocal<DateFormats> FORMATS = new ThreadLocal<DateFormats>() { @Override protected DateFormats initialValue() { return new DateFormats(); } }; // cannot create, the class has static methods only private DateTools() {} /** * Converts a Date to a string suitable for indexing. * * @param date the date to be converted * @param resolution the desired resolution, see * {@link #round(Date, DateTools.Resolution)} * @return a string in format <code>yyyyMMddHHmmssSSS</code> or shorter, * depending on <code>resolution</code>; using GMT as timezone */ public static String dateToString(Date date, Resolution resolution) { return timeToString(date.getTime(), resolution); } /** * Converts a millisecond time to a string suitable for indexing. * * @param time the date expressed as milliseconds since January 1, 1970, 00:00:00 GMT * @param resolution the desired resolution, see * {@link #round(long, DateTools.Resolution)} * @return a string in format <code>yyyyMMddHHmmssSSS</code> or shorter, * depending on <code>resolution</code>; using GMT as timezone */ public static String timeToString(long time, Resolution resolution) { final DateFormats formats = FORMATS.get(); formats.calInstance.setTimeInMillis(round(time, resolution)); final Date date = formats.calInstance.getTime(); switch (resolution) { case YEAR: return formats.YEAR_FORMAT.format(date); case MONTH:return formats.MONTH_FORMAT.format(date); case DAY: return formats.DAY_FORMAT.format(date); case HOUR: return formats.HOUR_FORMAT.format(date); case MINUTE: return formats.MINUTE_FORMAT.format(date); case SECOND: return formats.SECOND_FORMAT.format(date); case MILLISECOND: return formats.MILLISECOND_FORMAT.format(date); } throw new IllegalArgumentException("unknown resolution " + resolution); } /** * Converts a string produced by <code>timeToString</code> or * <code>dateToString</code> back to a time, represented as the * number of milliseconds since January 1, 1970, 00:00:00 GMT. * * @param dateString the date string to be converted * @return the number of milliseconds since January 1, 1970, 00:00:00 GMT * @throws ParseException if <code>dateString</code> is not in the * expected format */ public static long stringToTime(String dateString) throws ParseException { return stringToDate(dateString).getTime(); } /** * Converts a string produced by <code>timeToString</code> or * <code>dateToString</code> back to a time, represented as a * Date object. * * @param dateString the date string to be converted * @return the parsed time as a Date object * @throws ParseException if <code>dateString</code> is not in the * expected format */ public static Date stringToDate(String dateString) throws ParseException { final DateFormats formats = FORMATS.get(); if (dateString.length() == 4) { return formats.YEAR_FORMAT.parse(dateString); } else if (dateString.length() == 6) { return formats.MONTH_FORMAT.parse(dateString); } else if (dateString.length() == 8) { return formats.DAY_FORMAT.parse(dateString); } else if (dateString.length() == 10) { return formats.HOUR_FORMAT.parse(dateString); } else if (dateString.length() == 12) { return formats.MINUTE_FORMAT.parse(dateString); } else if (dateString.length() == 14) { return formats.SECOND_FORMAT.parse(dateString); } else if (dateString.length() == 17) { return formats.MILLISECOND_FORMAT.parse(dateString); } throw new ParseException("Input is not valid date string: " + dateString, 0); } /** * Limit a date's resolution. For example, the date <code>2004-09-21 13:50:11</code> * will be changed to <code>2004-09-01 00:00:00</code> when using * <code>Resolution.MONTH</code>. * * @param resolution The desired resolution of the date to be returned * @return the date with all values more precise than <code>resolution</code> * set to 0 or 1 */ public static Date round(Date date, Resolution resolution) { return new Date(round(date.getTime(), resolution)); } /** * Limit a date's resolution. For example, the date <code>1095767411000</code> * (which represents 2004-09-21 13:50:11) will be changed to * <code>1093989600000</code> (2004-09-01 00:00:00) when using * <code>Resolution.MONTH</code>. * * @param resolution The desired resolution of the date to be returned * @return the date with all values more precise than <code>resolution</code> * set to 0 or 1, expressed as milliseconds since January 1, 1970, 00:00:00 GMT */ public static long round(long time, Resolution resolution) { final Calendar calInstance = FORMATS.get().calInstance; calInstance.setTimeInMillis(time); switch (resolution) { case YEAR: calInstance.set(Calendar.MONTH, 0); calInstance.set(Calendar.DAY_OF_MONTH, 1); calInstance.set(Calendar.HOUR_OF_DAY, 0); calInstance.set(Calendar.MINUTE, 0); calInstance.set(Calendar.SECOND, 0); calInstance.set(Calendar.MILLISECOND, 0); break; case MONTH: calInstance.set(Calendar.DAY_OF_MONTH, 1); calInstance.set(Calendar.HOUR_OF_DAY, 0); calInstance.set(Calendar.MINUTE, 0); calInstance.set(Calendar.SECOND, 0); calInstance.set(Calendar.MILLISECOND, 0); break; case DAY: calInstance.set(Calendar.HOUR_OF_DAY, 0); calInstance.set(Calendar.MINUTE, 0); calInstance.set(Calendar.SECOND, 0); calInstance.set(Calendar.MILLISECOND, 0); break; case HOUR: calInstance.set(Calendar.MINUTE, 0); calInstance.set(Calendar.SECOND, 0); calInstance.set(Calendar.MILLISECOND, 0); break; case MINUTE: calInstance.set(Calendar.SECOND, 0); calInstance.set(Calendar.MILLISECOND, 0); break; case SECOND: calInstance.set(Calendar.MILLISECOND, 0); break; case MILLISECOND: // don't cut off anything break; default: throw new IllegalArgumentException("unknown resolution " + resolution); } return calInstance.getTimeInMillis(); } /** Specifies the time granularity. */ public static enum Resolution { YEAR, MONTH, DAY, HOUR, MINUTE, SECOND, MILLISECOND; /** this method returns the name of the resolution * in lowercase (for backwards compatibility) */ @Override public String toString() { return super.toString().toLowerCase(Locale.ENGLISH); } } }