1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420
use alloc::{string::String, sync::Arc, vec::Vec};
use crate::{error::Error, tz::TimeZone};
use self::{bundled::BundledZoneInfo, zoneinfo::ZoneInfo};
mod bundled;
mod zoneinfo;
/// Returns a copy of the global [`TimeZoneDatabase`].
///
/// This is the same database used for convenience routines like
/// [`Timestamp::intz`](crate::Timestamp::intz) and parsing routines
/// for [`Zoned`](crate::Zoned) that need to do IANA time zone identifier
/// lookups. Basically, whenever an implicit time zone database is needed,
/// it is *this* copy of the time zone database that is used.
///
/// In feature configurations where a time zone database cannot interact with
/// the file system (like when `std` is not enabled), this returns a database
/// where every lookup will fail.
///
/// # Example
///
/// ```
/// use jiff::tz;
///
/// assert!(tz::db().get("Antarctica/Troll").is_ok());
/// assert!(tz::db().get("does-not-exist").is_err());
/// ```
pub fn db() -> &'static TimeZoneDatabase {
#[cfg(not(feature = "std"))]
{
static NONE: TimeZoneDatabase = TimeZoneDatabase::none();
&NONE
}
#[cfg(feature = "std")]
{
use std::sync::OnceLock;
static DB: OnceLock<TimeZoneDatabase> = OnceLock::new();
DB.get_or_init(|| {
let db = TimeZoneDatabase::from_env();
debug!("initialized global time zone database: {db:?}");
db
})
}
}
/// A handle to a [IANA Time Zone Database].
///
/// A `TimeZoneDatabase` provides a way to lookup [`TimeZone`]s by their
/// human readable identifiers, such as `America/Los_Angeles` and
/// `Europe/Warsaw`.
///
/// It is rare to need to create or use this type directly. Routines
/// like zoned datetime parsing and time zone conversion provide
/// convenience routines for using an implicit global time zone database
/// by default. This global time zone database is available via
/// [`jiff::tz::db`](crate::tz::db()`). But lower level parsing routines
/// such as
/// [`fmt::temporal::DateTimeParser::parse_zoned_with`](crate::fmt::temporal::DateTimeParser::parse_zoned_with)
/// and
/// [`civil::DateTime::to_zoned`](crate::civil::DateTime::to_zoned) provide a
/// means to use a custom copy of a `TimeZoneDatabase`.
///
/// # Platform behavior
///
/// This behavior is subject to change.
///
/// On Unix systems, and when the `tzdb-zoneinfo` crate feature is enabled
/// (which it is by default), Jiff will read the `/usr/share/zoneinfo`
/// directory for time zone data.
///
/// On Windows systems and when the `tzdb-bundle-platform` crate feature is
/// enabled (which it is by default), _or_ when the `tzdb-bundle-always` crate
/// feature is enabled, then the `jiff-tzdb` crate will be used to embed the
/// entire Time Zone Database into the compiled artifact.
///
/// In general, using `/usr/share/zoneinfo` (or an equivalent) is heavily
/// preferred in lieu of embedding the database into your compiled artifact.
/// The reason is because your system copy of the Time Zone Database may be
/// updated, perhaps a few times a year, and it is better to get seamless
/// updates through your system rather than needing to wait on a Rust crate
/// to update and then rebuild your software. The bundling approach should
/// only be used when there is no plausible alternative. For example, Windows
/// has no canonical location for a copy of the Time Zone Database. Indeed,
/// this is why the Cargo configuration of Jiff specifically does not enabled
/// bundling by default on Unix systems, but does enable it by default on
/// Windows systems. Of course, if you really do need a copy of the database
/// bundled, then you can enable the `tzdb-bundle-always` crate feature.
///
/// # Cloning
///
/// A `TimeZoneDatabase` can be cheaply cloned. It will share a thread safe
/// cache with other copies of the same `TimeZoneDatabase`.
///
/// # Caching
///
/// Because looking up a time zone on disk, reading the file into memory
/// and parsing the time zone transitions out of that file requires
/// a fair amount of work, a `TimeZoneDatabase` does a fair bit of
/// caching. This means that the vast majority of calls to, for example,
/// [`Timestamp::intz`](crate::Timestamp::intz) don't actually need to hit
/// disk. It will just find a cached copy of a [`TimeZone`] and return that.
///
/// Of course, with caching comes problems of cache invalidation. Invariably,
/// there are parameters that Jiff uses to manage when the cache should be
/// invalidated. Jiff tries to emit log messages about this when it happens. If
/// you find the caching behavior of Jiff to be sub-optimal for your use case,
/// please create an issue. (The plan is likely to expose some options for
/// configuring the behavior of a `TimeZoneDatabase`, but I wanted to collect
/// user feedback first.)
///
/// [IANA Time Zone Database]: https://en.wikipedia.org/wiki/Tz_database
///
/// # Example: list all available time zones
///
/// ```no_run
/// use jiff::tz;
///
/// for tzid in tz::db().available() {
/// println!("{tzid}");
/// }
/// ```
///
/// # Example: using multiple time zone databases
///
/// Jiff supports opening and using multiple time zone databases by default.
/// All you need to do is point [`TimeZoneDatabase::from_dir`] to your own
/// copy of the Time Zone Database, and it will handle the rest.
///
/// This example shows how to utilize multiple databases by parsing a datetime
/// using an older copy of the IANA Time Zone Database. This example leverages
/// the fact that the 2018 copy of the database preceded Brazil's announcement
/// that daylight saving time would be abolished. This meant that datetimes
/// in the future, when parsed with the older copy of the Time Zone Database,
/// would still follow the old daylight saving time rules. But a mere update of
/// the database would otherwise change the meaning of the datetime.
///
/// This scenario can come up if one stores datetimes in the future. This is
/// also why the default offset conflict resolution strategy when parsing zoned
/// datetimes is [`OffsetConflict::Reject`](crate::tz::OffsetConflict::Reject),
/// which prevents one from silently re-interpreting datetimes to a different
/// timestamp.
///
/// ```no_run
/// use jiff::{fmt::temporal::DateTimeParser, tz::{self, TimeZoneDatabase}};
///
/// static PARSER: DateTimeParser = DateTimeParser::new();
///
/// // Open a version of tzdb from before Brazil announced its abolition
/// // of daylight saving time.
/// let tzdb2018 = TimeZoneDatabase::from_dir("path/to/tzdb-2018b")?;
/// // Open the system tzdb.
/// let tzdb = tz::db();
///
/// // Parse the same datetime string with the same parser, but using two
/// // different versions of tzdb.
/// let dt = "2020-01-15T12:00[America/Sao_Paulo]";
/// let zdt2018 = PARSER.parse_zoned_with(&tzdb2018, dt)?;
/// let zdt = PARSER.parse_zoned_with(tzdb, dt)?;
///
/// // Before DST was abolished, 2020-01-15 was in DST, which corresponded
/// // to UTC offset -02. Since DST rules applied to datetimes in the
/// // future, the 2018 version of tzdb would lead one to interpret
/// // 2020-01-15 as being in DST.
/// assert_eq!(zdt2018.offset(), tz::offset(-2));
/// // But DST was abolished in 2019, which means that 2020-01-15 was no
/// // no longer in DST. So after a tzdb update, the same datetime as above
/// // now has a different offset.
/// assert_eq!(zdt.offset(), tz::offset(-3));
///
/// // So if you try to parse a datetime serialized from an older copy of
/// // tzdb, you'll get an error under the default configuration because
/// // of `OffsetConflict::Reject`. This would succeed if you parsed it
/// // using tzdb2018!
/// assert!(PARSER.parse_zoned_with(tzdb, zdt2018.to_string()).is_err());
///
/// # Ok::<(), Box<dyn std::error::Error>>(())
/// ```
#[derive(Clone)]
pub struct TimeZoneDatabase {
inner: Option<Arc<TimeZoneDatabaseInner>>,
}
#[derive(Debug)]
struct TimeZoneDatabaseInner {
zoneinfo: ZoneInfo,
bundled: BundledZoneInfo,
}
impl TimeZoneDatabase {
/// Returns a database for which all time zone lookups fail.
///
/// # Example
///
/// ```
/// use jiff::tz::TimeZoneDatabase;
///
/// let db = TimeZoneDatabase::none();
/// assert_eq!(db.available().count(), 0);
/// ```
pub const fn none() -> TimeZoneDatabase {
TimeZoneDatabase { inner: None }
}
/// Returns a time zone database initialized from the current environment.
///
/// This routine never fails, but it may not be able to find a copy of
/// your Time Zone Database. When this happens, log messages (with some
/// at least at the `WARN` level) will be emitted. They can be viewed by
/// installing a [`log`] compatible logger such as [`env_logger`].
///
/// Typically, one does not need to call this routine directly. Instead,
/// it's done for you as part of [`jiff::tz::db`](crate::tz::db()).
///
/// Beware that calling this constructor will create a new _distinct_
/// handle from the one returned by `jiff::tz::db` with its own cache.
///
/// [`log`]: https://docs.rs/log
/// [`env_logger`]: https://docs.rs/env_logger
///
/// # Platform behavior
///
/// When the `TZDIR` environment variable is set, this will attempt to
/// open the Time Zone Database at the directory specified. Otherwise,
/// this will search a list of predefined directories for a system
/// installation of the Time Zone Database. Typically, it's found at
/// `/usr/share/zoneinfo`.
///
/// On Windows systems, under the default crate configuration, this will
/// return an embedded copy of the Time Zone Database since Windows does
/// not have a canonical installation of the Time Zone Database.
pub fn from_env() -> TimeZoneDatabase {
let zoneinfo = ZoneInfo::from_env();
let bundled = BundledZoneInfo::new();
let inner = TimeZoneDatabaseInner { zoneinfo, bundled };
TimeZoneDatabase { inner: Some(Arc::new(inner)) }
}
/// Returns a time zone database initialized from the given directory.
///
/// Unlike [`TimeZoneDatabase::from_env`], this always attempts to look for
/// a copy of the Time Zone Database at the directory given. And if it
/// fails to find one at that directory, then an error is returned.
///
/// Basically, you should use this when you need to use a _specific_
/// copy of the Time Zone Database, and use `TimeZoneDatabase::from_env`
/// when you just want Jiff to try and "do the right thing for you."
///
/// # Errors
///
/// This returns an error if the given directory does not contain a valid
/// copy of the Time Zone Database. Generally, this means a directory with
/// at least one valid TZif file.
#[cfg(feature = "std")]
pub fn from_dir<P: AsRef<std::path::Path>>(
path: P,
) -> Result<TimeZoneDatabase, Error> {
let zoneinfo = ZoneInfo::from_dir(path.as_ref())?;
let bundled = BundledZoneInfo::new();
let inner = TimeZoneDatabaseInner { zoneinfo, bundled };
Ok(TimeZoneDatabase { inner: Some(Arc::new(inner)) })
}
/// Returns a [`TimeZone`] corresponding to the IANA time zone identifier
/// given.
///
/// The lookup is performed without regard to ASCII case.
///
/// To see a list of all available time zone identifiers for this database,
/// use [`TimeZoneDatabase::available`].
///
/// # Example
///
/// ```
/// use jiff::tz;
///
/// let tz = tz::db().get("america/NEW_YORK")?;
/// assert_eq!(tz.iana_name(), Some("America/New_York"));
///
/// # Ok::<(), Box<dyn std::error::Error>>(())
/// ```
pub fn get(&self, name: &str) -> Result<TimeZone, Error> {
let inner = self
.inner
.as_deref()
.ok_or_else(|| Error::time_zone_lookup(name))?;
if let Some(tz) = inner.zoneinfo.get(name) {
trace!(
"found time zone {name} in system zoneinfo ({:?}) database",
inner.zoneinfo,
);
return Ok(tz);
}
if let Some(tz) = inner.bundled.get(name) {
trace!("found time zone {name} in bundled zoneinfo database");
return Ok(tz);
}
Err(Error::time_zone_lookup(name))
}
/// Returns a list of all available time zone identifiers from this
/// database.
///
/// Note that time zone identifiers are more of a machine readable
/// abstraction and not an end user level abstraction. Still, users
/// comfortable with configuring their system's default time zone through
/// IANA time zone identifiers are probably comfortable interacting with
/// the identifiers returned here.
///
/// # Example
///
/// ```no_run
/// use jiff::tz;
///
/// for tzid in tz::db().available() {
/// println!("{tzid}");
/// }
/// ```
pub fn available(&self) -> TimeZoneNameIter {
let Some(ref inner) = self.inner else {
return TimeZoneNameIter { it: Vec::new().into_iter() };
};
let mut all = inner.zoneinfo.available();
all.extend(inner.bundled.available());
all.sort();
all.dedup();
TimeZoneNameIter { it: all.into_iter() }
}
/// Resets the internal cache of this database.
///
/// Subsequent interactions with this database will need to re-read time
/// zone data from disk.
///
/// It might be useful to call this if you know the time zone database
/// has changed on disk and want to force Jiff to re-load it immediately
/// without spawning a new process or waiting for Jiff's internal cache
/// invalidation heuristics to kick in.
pub fn reset(&self) {
let Some(inner) = self.inner.as_deref() else { return };
inner.zoneinfo.reset();
inner.bundled.reset();
}
/// Returns true if it is known that this time zone database is empty.
///
/// When this returns true, it is guaranteed that all
/// [`TimeZoneDatabase::get`] calls will fail, and that
/// [`TimeZoneDatabase::available`] will always return an empty iterator.
///
/// Note that if this returns false, it is still possible for this database
/// to be empty.
///
/// # Example
///
/// ```
/// use jiff::tz::TimeZoneDatabase;
///
/// let db = TimeZoneDatabase::none();
/// assert!(db.is_definitively_empty());
/// ```
pub fn is_definitively_empty(&self) -> bool {
let Some(inner) = self.inner.as_deref() else { return true };
inner.zoneinfo.is_definitively_empty()
&& inner.bundled.is_definitively_empty()
}
}
impl core::fmt::Debug for TimeZoneDatabase {
fn fmt(&self, f: &mut core::fmt::Formatter) -> core::fmt::Result {
write!(f, "TimeZoneDatabase(")?;
let Some(inner) = self.inner.as_deref() else {
return write!(f, "unavailable)");
};
write!(f, "system={:?}", inner.zoneinfo)?;
if !inner.bundled.is_definitively_empty() {
write!(f, " and bundled")?;
}
write!(f, ")")?;
Ok(())
}
}
/// An iterator over the time zone identifiers in a [`TimeZoneDatabase`].
///
/// This iterator is created by [`TimeZoneDatabase::available`].
///
/// There are no guarantees about the order in which this iterator yields
/// time zone identifiers.
#[derive(Clone, Debug)]
pub struct TimeZoneNameIter {
it: alloc::vec::IntoIter<String>,
}
impl Iterator for TimeZoneNameIter {
type Item = String;
fn next(&mut self) -> Option<String> {
self.it.next()
}
}
#[cfg(test)]
mod tests {
use super::*;
/// This tests that the size of a time zone database is kept at a single
/// word.
///
/// I think it would probably be okay to make this bigger if we had a
/// good reason to, but it seems sensible to put a road-block to avoid
/// accidentally increasing its size.
#[test]
fn time_zone_database_size() {
let word = core::mem::size_of::<usize>();
assert_eq!(word, core::mem::size_of::<TimeZoneDatabase>());
}
}