Seek zone abbreviations in the IANA data before timezone_abbreviations.

author Tom Lane <tgl@sss.pgh.pa.us>

Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)

committer Tom Lane <tgl@sss.pgh.pa.us>

Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)
author Tom Lane <tgl@sss.pgh.pa.us>
Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)
committer Tom Lane <tgl@sss.pgh.pa.us>
Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)
diff --git a/doc/src/sgml/config.sgml b/doc/src/sgml/config.sgml

index 3f41a17b1fe7ba079a2187e303837501ad78adde..a8866292d46052e4e5227c3fe42b9e9abb7b2d7d 100644 (file)
--- a/doc/src/sgml/config.sgml
+++ b/doc/src/sgml/config.sgml
@@ -10054,8 +10054,10 @@ SET XML OPTION { DOCUMENT | CONTENT };
        </term>
        <listitem>
         <para>
-        Sets the collection of time zone abbreviations that will be accepted
-        by the server for datetime input.  The default is <literal>'Default'</literal>,
+        Sets the collection of additional time zone abbreviations that
+        will be accepted by the server for datetime input (beyond any
+        abbreviations defined by the current <varname>TimeZone</varname>
+        setting).  The default is <literal>'Default'</literal>,
          which is a collection that works in most of the world; there are
          also <literal>'Australia'</literal> and <literal>'India'</literal>,
          and other collections can be defined for a particular installation.
diff --git a/doc/src/sgml/datatype.sgml b/doc/src/sgml/datatype.sgml

index 3e6751d64cc70f6b5d5b44fd62ce8d6db1cede15..1d9127e94e44bd431e397a7aebf1a2ca9de17da8 100644 (file)
--- a/doc/src/sgml/datatype.sgml
+++ b/doc/src/sgml/datatype.sgml
@@ -2534,6 +2534,10 @@ TIMESTAMP WITH TIME ZONE '2004-10-19 10:23:54+02'
       abbreviation if one is in common use in the current zone.  Otherwise
       it appears as a signed numeric offset in ISO 8601 basic format
       (<replaceable>hh</replaceable> or <replaceable>hhmm</replaceable>).
+     The alphabetic abbreviations shown in these styles are taken from the
+     IANA time zone database entry currently selected by the
+     <xref linkend="guc-timezone"/> run-time parameter; they are not
+     affected by the <xref linkend="guc-timezone-abbreviations"/> setting.
      </para>
  
      <para>
diff --git a/doc/src/sgml/datetime.sgml b/doc/src/sgml/datetime.sgml

index e7035c7806538322d8b45fb61411fbf5d784f777..3e24170acbfcc3823cfac64e292fa97b7e601a84 100644 (file)
--- a/doc/src/sgml/datetime.sgml
+++ b/doc/src/sgml/datetime.sgml
@@ -80,7 +80,7 @@
        <step>
         <para>
          See if the token matches any known time zone abbreviation.
-        These abbreviations are supplied by the configuration file
+        These abbreviations are determined by the configuration settings
          described in <xref linkend="datetime-config-files"/>.
         </para>
        </step>
@@ -424,9 +424,43 @@
     <para>
      Since timezone abbreviations are not well standardized,
      <productname>PostgreSQL</productname> provides a means to customize
-    the set of abbreviations accepted by the server.  The
-    <xref linkend="guc-timezone-abbreviations"/> run-time parameter
-    determines the active set of abbreviations.  While this parameter
+    the set of abbreviations accepted in datetime input.
+    There are two sources for these abbreviations:
+
+    <orderedlist>
+     <listitem>
+      <para>
+       The <xref linkend="guc-timezone"/> run-time parameter is usually
+       set to the name of an entry in the IANA time zone database.
+       If that zone has widely-used zone abbreviations, they will appear
+       in the IANA data, and <productname>PostgreSQL</productname> will
+       preferentially recognize those abbreviations with the meanings
+       given in the IANA data.
+       For example, if <varname>timezone</varname> is set
+       to <literal>America/New_York</literal> then <literal>EST</literal>
+       will be understood as UTC-5 and <literal>EDT</literal> will be
+       understood as UTC-4.  (These IANA abbreviations will also be used
+       in datetime output, if <xref linkend="guc-datestyle"/> is set to a
+       style that prefers non-numeric zone abbreviations.)
+      </para>
+     </listitem>
+
+     <listitem>
+      <para>
+       If an abbreviation is not found in the current IANA time zone,
+       it is sought in the list specified by the
+       <xref linkend="guc-timezone-abbreviations"/> run-time parameter.
+       The <varname>timezone_abbreviations</varname> list is primarily
+       useful for allowing datetime input to recognize abbreviations for
+       time zones other than the current zone.  (These abbreviations will
+       not be used in datetime output.)
+      </para>
+     </listitem>
+    </orderedlist>
+   </para>
+
+   <para>
+    While the <varname>timezone_abbreviations</varname> parameter
      can be altered by any database user, the possible values for it
      are under the control of the database administrator &mdash; they
      are in fact names of configuration files stored in
diff --git a/doc/src/sgml/system-views.sgml b/doc/src/sgml/system-views.sgml

index a586156614d15179db42554403adf99d908445dc..8e2b0a7927b420daf79a9e04ddd756fc7d26a023 100644 (file)
--- a/doc/src/sgml/system-views.sgml
+++ b/doc/src/sgml/system-views.sgml
@@ -4566,7 +4566,9 @@ SELECT * FROM pg_locks pl LEFT JOIN pg_prepared_xacts ppx
     The view <structname>pg_timezone_abbrevs</structname> provides a list
     of time zone abbreviations that are currently recognized by the datetime
     input routines.  The contents of this view change when the
-   <xref linkend="guc-timezone-abbreviations"/> run-time parameter is modified.
+   <xref linkend="guc-timezone"/> or
+   <xref linkend="guc-timezone-abbreviations"/> run-time parameters are
+   modified.
    </para>
  
    <table>
diff --git a/src/backend/catalog/system_views.sql b/src/backend/catalog/system_views.sql

index 64a873a16e3cdb565e25334cce651143b5375e7d..46868bf7e89123d92fcd6e52c2b2cbaf49a72b3b 100644 (file)
--- a/src/backend/catalog/system_views.sql
+++ b/src/backend/catalog/system_views.sql
@@ -634,7 +634,12 @@ REVOKE ALL ON pg_ident_file_mappings FROM PUBLIC;
  REVOKE EXECUTE ON FUNCTION pg_ident_file_mappings() FROM PUBLIC;
  
  CREATE VIEW pg_timezone_abbrevs AS
-    SELECT * FROM pg_timezone_abbrevs();
+    SELECT * FROM pg_timezone_abbrevs_zone() z
+    UNION ALL
+    (SELECT * FROM pg_timezone_abbrevs_abbrevs() a
+     WHERE NOT EXISTS (SELECT 1 FROM pg_timezone_abbrevs_zone() z2
+                       WHERE z2.abbrev = a.abbrev))
+    ORDER BY abbrev;
  
  CREATE VIEW pg_timezone_names AS
      SELECT * FROM pg_timezone_names();
diff --git a/src/backend/commands/variable.c b/src/backend/commands/variable.c

index 44796bf15ad4f80e5316e6796ee9b65792087c2c..4ad6e236d69928382060fcbea1f4e9bc3e157785 100644 (file)
--- a/src/backend/commands/variable.c
+++ b/src/backend/commands/variable.c
@@ -381,6 +381,8 @@ void
  assign_timezone(const char *newval, void *extra)
  {
     session_timezone = *((pg_tz **) extra);
+   /* datetime.c's cache of timezone abbrevs may now be obsolete */
+   ClearTimeZoneAbbrevCache();
  }
  
  /*
diff --git a/src/backend/utils/adt/datetime.c b/src/backend/utils/adt/datetime.c

index d8af3591d1791b5d41ff9b6e939db3408e4113d1..5d893cff50c8fd18235a05931c60636ea6bbaa4a 100644 (file)
--- a/src/backend/utils/adt/datetime.c
+++ b/src/backend/utils/adt/datetime.c
@@ -259,7 +259,17 @@ static const datetkn *datecache[MAXDATEFIELDS] = {NULL};
  
  static const datetkn *deltacache[MAXDATEFIELDS] = {NULL};
  
-static const datetkn *abbrevcache[MAXDATEFIELDS] = {NULL};
+/* Cache of successful timezone abbreviation lookups, one slot per field */
+
+typedef struct TzAbbrevCache
+{
+   char        abbrev[TOKMAXLEN + 1];  /* lookup key; always NUL-terminated */
+   char        ftype;          /* TZ, DTZ, or DYNTZ */
+   int         offset;         /* fixed GMT offset, zoneabbrevtbl sign */
+   pg_tz      *tz;             /* relevant zone, if variable-offset */
+} TzAbbrevCache;
+
+static TzAbbrevCache tzabbrevcache[MAXDATEFIELDS];
  
  
  /*
@@ -1845,6 +1855,40 @@ DetermineTimeZoneAbbrevOffsetInternal(pg_time_t t, const char *abbr, pg_tz *tzp,
  }
  
  
+/* TimeZoneAbbrevIsKnown()
+ * Case-insensitively check whether abbr is an abbreviation of TZDB zone tzp.
+ * Returns true if so, with *isfixed telling whether it has a single meaning;
+ * *offset (sign as in DetermineTimeZoneOffset()) and *isdst are set by the
+ * lookup, and are meaningful only when *isfixed is true.
+ */
+static bool
+TimeZoneAbbrevIsKnown(const char *abbr, pg_tz *tzp,
+                     bool *isfixed, int *offset, int *isdst)
+{
+   char        upabbr[TZ_STRLEN_MAX + 1];
+   unsigned char *p;
+   long int    gmtoff;
+
+   /* The lookup below is case-sensitive, so work on an upper-cased copy */
+   strlcpy(upabbr, abbr, sizeof(upabbr));
+   for (p = (unsigned char *) upabbr; *p; p++)
+       *p = pg_toupper(*p);
+
+   /* Look up the abbrev's meaning in this zone */
+   if (pg_timezone_abbrev_is_known(upabbr,
+                                   isfixed,
+                                   &gmtoff,
+                                   isdst,
+                                   tzp))
+   {
+       /* Change sign to agree with DetermineTimeZoneOffset() */
+       *offset = (int) -gmtoff;
+       return true;
+   }
+   return false;
+}
+
+
  /* DecodeTimeOnly()
   * Interpret parsed string as time fields only.
   * Returns 0 if successful, DTERR code if bogus input detected.
@@ -3092,27 +3136,60 @@ DecodeTimezoneAbbrev(int field, const char *lowtoken,
                      int *ftype, int *offset, pg_tz **tz,
                      DateTimeErrorExtra *extra)
  {
+   TzAbbrevCache *tzc = &tzabbrevcache[field];
+   bool        isfixed;
+   int         isdst;
     const datetkn *tp;
  
-   tp = abbrevcache[field];
-   /* use strncmp so that we match truncated tokens */
-   if (tp == NULL || strncmp(lowtoken, tp->token, TOKMAXLEN) != 0)
+   /*
+    * Do we have a cached result?  Use strncmp so that we match truncated
+    * names, although we shouldn't really see that happen with normal
+    * abbreviations.
+    */
+   if (strncmp(lowtoken, tzc->abbrev, TOKMAXLEN) == 0)
     {
-       if (zoneabbrevtbl)
-           tp = datebsearch(lowtoken, zoneabbrevtbl->abbrevs,
-                            zoneabbrevtbl->numabbrevs);
-       else
-           tp = NULL;
+       *ftype = tzc->ftype;
+       *offset = tzc->offset;
+       *tz = tzc->tz;
+       return 0;
+   }
+
+   /*
+    * See if the current session_timezone recognizes it.  Checking this
+    * before zoneabbrevtbl allows us to correctly handle abbreviations whose
+    * meaning varies across zones, such as "LMT".
+    */
+   if (session_timezone &&
+       TimeZoneAbbrevIsKnown(lowtoken, session_timezone,
+                             &isfixed, offset, &isdst))
+   {
+       *ftype = (isfixed ? (isdst ? DTZ : TZ) : DYNTZ);
+       *tz = (isfixed ? NULL : session_timezone);
+       /* flip sign to agree with the convention used in zoneabbrevtbl */
+       *offset = -(*offset);
+       /* cache result; use strlcpy to truncate name if necessary */
+       strlcpy(tzc->abbrev, lowtoken, TOKMAXLEN + 1);
+       tzc->ftype = *ftype;
+       tzc->offset = *offset;
+       tzc->tz = *tz;
+       return 0;
     }
+
+   /* Nope, so look in zoneabbrevtbl */
+   if (zoneabbrevtbl)
+       tp = datebsearch(lowtoken, zoneabbrevtbl->abbrevs,
+                        zoneabbrevtbl->numabbrevs);
+   else
+       tp = NULL;
     if (tp == NULL)
     {
         *ftype = UNKNOWN_FIELD;
         *offset = 0;
         *tz = NULL;
+       /* failure results are not cached */
     }
     else
     {
-       abbrevcache[field] = tp;
         *ftype = tp->type;
         if (tp->type == DYNTZ)
         {
@@ -3126,11 +3203,26 @@ DecodeTimezoneAbbrev(int field, const char *lowtoken,
             *offset = tp->value;
             *tz = NULL;
         }
+
+       /* cache result; use strlcpy to truncate name if necessary */
+       strlcpy(tzc->abbrev, lowtoken, TOKMAXLEN + 1);
+       tzc->ftype = *ftype;
+       tzc->offset = *offset;
+       tzc->tz = *tz;
     }
  
     return 0;
  }
  
+/*
+ * Empty tzabbrevcache; must be called whenever session_timezone changes.
+ */
+void
+ClearTimeZoneAbbrevCache(void)
+{
+   memset(tzabbrevcache, 0, sizeof(tzabbrevcache));
+}
+
  
  /* DecodeSpecial()
   * Decode text string using lookup table.
@@ -3278,9 +3370,6 @@ DecodeTimezoneAbbrevPrefix(const char *str, int *offset, pg_tz **tz)
     *offset = 0;                /* avoid uninitialized vars on failure */
     *tz = NULL;
  
-   if (!zoneabbrevtbl)
-       return -1;              /* no abbrevs known, so fail immediately */
-
     /* Downcase as much of the string as we could need */
     for (len = 0; len < TOKMAXLEN; len++)
     {
@@ -3299,9 +3388,34 @@ DecodeTimezoneAbbrevPrefix(const char *str, int *offset, pg_tz **tz)
      */
     while (len > 0)
     {
-       const datetkn *tp = datebsearch(lowtoken, zoneabbrevtbl->abbrevs,
-                                       zoneabbrevtbl->numabbrevs);
+       bool        isfixed;
+       int         isdst;
+       const datetkn *tp;
+
+       /* See if the current session_timezone recognizes it. */
+       if (session_timezone &&
+           TimeZoneAbbrevIsKnown(lowtoken, session_timezone,
+                                 &isfixed, offset, &isdst))
+       {
+           if (isfixed)
+           {
+               /* flip sign to agree with the convention in zoneabbrevtbl */
+               *offset = -(*offset);
+           }
+           else
+           {
+               /* Caller must resolve the abbrev's current meaning */
+               *tz = session_timezone;
+           }
+           return len;
+       }
  
+       /* Known in zoneabbrevtbl? */
+       if (zoneabbrevtbl)
+           tp = datebsearch(lowtoken, zoneabbrevtbl->abbrevs,
+                            zoneabbrevtbl->numabbrevs);
+       else
+           tp = NULL;
         if (tp != NULL)
         {
             if (tp->type == DYNTZ)
@@ -3324,6 +3438,8 @@ DecodeTimezoneAbbrevPrefix(const char *str, int *offset, pg_tz **tz)
                 return len;
             }
         }
+
+       /* Nope, try the next shorter string. */
         lowtoken[--len] = '\0';
     }
  
@@ -4957,8 +5073,8 @@ void
  InstallTimeZoneAbbrevs(TimeZoneAbbrevTable *tbl)
  {
     zoneabbrevtbl = tbl;
-   /* reset abbrevcache, which may contain pointers into old table */
-   memset(abbrevcache, 0, sizeof(abbrevcache));
+   /* reset tzabbrevcache, which may contain results from old table */
+   memset(tzabbrevcache, 0, sizeof(tzabbrevcache));
  }
  
  /*
@@ -4994,11 +5110,99 @@ FetchDynamicTimeZone(TimeZoneAbbrevTable *tbl, const datetkn *tp,
  
  
  /*
- * This set-returning function reads all the available time zone abbreviations
+ * This set-returning function reads all the time zone abbreviations
+ * defined by the IANA data for the current timezone setting,
+ * and returns a set of (abbrev, utc_offset, is_dst).
+ */
+Datum
+pg_timezone_abbrevs_zone(PG_FUNCTION_ARGS)
+{
+   FuncCallContext *funcctx;
+   int        *pindex;
+   Datum       result;
+   HeapTuple   tuple;
+   Datum       values[3];
+   bool        nulls[3] = {0};
+   TimestampTz now = GetCurrentTransactionStartTimestamp();
+   pg_time_t   t = timestamptz_to_time_t(now);
+   const char *abbrev;
+   long int    gmtoff;
+   int         isdst;
+   struct pg_itm_in itm_in;
+   Interval   *resInterval;
+
+   /* stuff done only on the first call of the function */
+   if (SRF_IS_FIRSTCALL())
+   {
+       TupleDesc   tupdesc;
+       MemoryContext oldcontext;
+
+       /* create a function context for cross-call persistence */
+       funcctx = SRF_FIRSTCALL_INIT();
+
+       /*
+        * switch to memory context appropriate for multiple function calls
+        */
+       oldcontext = MemoryContextSwitchTo(funcctx->multi_call_memory_ctx);
+
+       /* user context: scan index for pg_get_next_timezone_abbrev() */
+       pindex = (int *) palloc(sizeof(int));
+       *pindex = 0;
+       funcctx->user_fctx = pindex;
+
+       if (get_call_result_type(fcinfo, NULL, &tupdesc) != TYPEFUNC_COMPOSITE)
+           elog(ERROR, "return type must be a row type");
+       funcctx->tuple_desc = tupdesc;
+
+       MemoryContextSwitchTo(oldcontext);
+   }
+
+   /* stuff done on every call of the function */
+   funcctx = SRF_PERCALL_SETUP();
+   pindex = (int *) funcctx->user_fctx;
+
+   while ((abbrev = pg_get_next_timezone_abbrev(pindex,
+                                                session_timezone)) != NULL)
+   {
+       /* Ignore abbreviations that aren't all upper-case ASCII letters */
+       if (strspn(abbrev, "ABCDEFGHIJKLMNOPQRSTUVWXYZ") != strlen(abbrev))
+           continue;
+
+       /* Determine the abbrev's meaning at time t (transaction start) */
+       if (!pg_interpret_timezone_abbrev(abbrev,
+                                         &t,
+                                         &gmtoff,
+                                         &isdst,
+                                         session_timezone))
+           continue;           /* hm, not actually used in this zone? */
+
+       values[0] = CStringGetTextDatum(abbrev);
+
+       /* Convert offset (in seconds) to an interval; can't overflow */
+       MemSet(&itm_in, 0, sizeof(struct pg_itm_in));
+       itm_in.tm_usec = (int64) gmtoff * USECS_PER_SEC;
+       resInterval = (Interval *) palloc(sizeof(Interval));
+       (void) itmin2interval(&itm_in, resInterval);
+       values[1] = IntervalPGetDatum(resInterval);
+
+       values[2] = BoolGetDatum(isdst);
+
+       tuple = heap_form_tuple(funcctx->tuple_desc, values, nulls);
+       result = HeapTupleGetDatum(tuple);
+
+       SRF_RETURN_NEXT(funcctx, result);
+   }
+
+   SRF_RETURN_DONE(funcctx);
+}
+
+/*
+ * This set-returning function reads all the time zone abbreviations
+ * defined by the timezone_abbreviations setting,
   * and returns a set of (abbrev, utc_offset, is_dst).
   */
  Datum
-pg_timezone_abbrevs(PG_FUNCTION_ARGS)
+pg_timezone_abbrevs_abbrevs(PG_FUNCTION_ARGS)
  {
     FuncCallContext *funcctx;
     int        *pindex;
diff --git a/src/include/catalog/catversion.h b/src/include/catalog/catversion.h

index e5446845614ec782018e4b89ab19494e76e9233b..54856ab214d40401195ff4a3f58a303993f176c9 100644 (file)
--- a/src/include/catalog/catversion.h
+++ b/src/include/catalog/catversion.h
@@ -57,6 +57,6 @@
   */
  
  /*                         yyyymmddN */
-#define CATALOG_VERSION_NO 202501161
+#define CATALOG_VERSION_NO 202501162
  
  #endif
diff --git a/src/include/catalog/pg_proc.dat b/src/include/catalog/pg_proc.dat

index ba02ba53b29adf74e18d681576dd01abd0347b8f..18560755d26f4742d02a847793f100d845fe961a 100644 (file)
--- a/src/include/catalog/pg_proc.dat
+++ b/src/include/catalog/pg_proc.dat
@@ -8392,12 +8392,18 @@
    proargmodes => '{o,o,o,o,o,o}',
    proargnames => '{name,statement,is_holdable,is_binary,is_scrollable,creation_time}',
    prosrc => 'pg_cursor' },
-{ oid => '2599', descr => 'get the available time zone abbreviations',
-  proname => 'pg_timezone_abbrevs', prorows => '1000', proretset => 't',
+{ oid => '9221', descr => 'get abbreviations from current timezone',
+  proname => 'pg_timezone_abbrevs_zone', prorows => '10', proretset => 't',
    provolatile => 's', prorettype => 'record', proargtypes => '',
    proallargtypes => '{text,interval,bool}', proargmodes => '{o,o,o}',
    proargnames => '{abbrev,utc_offset,is_dst}',
-  prosrc => 'pg_timezone_abbrevs' },
+  prosrc => 'pg_timezone_abbrevs_zone' },
+{ oid => '2599', descr => 'get abbreviations from timezone_abbreviations',
+  proname => 'pg_timezone_abbrevs_abbrevs', prorows => '1000', proretset => 't',
+  provolatile => 's', prorettype => 'record', proargtypes => '',
+  proallargtypes => '{text,interval,bool}', proargmodes => '{o,o,o}',
+  proargnames => '{abbrev,utc_offset,is_dst}',
+  prosrc => 'pg_timezone_abbrevs_abbrevs' },
  { oid => '2856', descr => 'get the available time zone names',
    proname => 'pg_timezone_names', prorows => '1000', proretset => 't',
    provolatile => 's', prorettype => 'record', proargtypes => '',
diff --git a/src/include/pgtime.h b/src/include/pgtime.h

index 37171f17374b896043d14b51f864bafd92a27506..5fc9f223de30a1d9c25edf91d03ded2c8cb4be52 100644 (file)
--- a/src/include/pgtime.h
+++ b/src/include/pgtime.h
@@ -69,6 +69,13 @@ extern bool pg_interpret_timezone_abbrev(const char *abbrev,
                                          long int *gmtoff,
                                          int *isdst,
                                          const pg_tz *tz);
+extern bool pg_timezone_abbrev_is_known(const char *abbrev,
+                                       bool *isfixed,
+                                       long int *gmtoff,
+                                       int *isdst,
+                                       const pg_tz *tz);
+extern const char *pg_get_next_timezone_abbrev(int *indx,
+                                              const pg_tz *tz);
  extern bool pg_get_timezone_offset(const pg_tz *tz, long int *gmtoff);
  extern const char *pg_get_timezone_name(pg_tz *tz);
  extern bool pg_tz_acceptable(pg_tz *tz);
diff --git a/src/include/utils/datetime.h b/src/include/utils/datetime.h

index 7fe12a4ea70fd948fffa882a71c02fcbfa9f3116..53a1c69eda52dea31af1fa8a2d87ea92687ec0e4 100644 (file)
--- a/src/include/utils/datetime.h
+++ b/src/include/utils/datetime.h
@@ -351,6 +351,8 @@ extern pg_tz *DecodeTimezoneNameToTz(const char *tzname);
  extern int DecodeTimezoneAbbrevPrefix(const char *str,
                                        int *offset, pg_tz **tz);
  
+extern void ClearTimeZoneAbbrevCache(void);
+
  extern int j2day(int date);
  
  extern struct Node *TemporalSimplify(int32 max_precis, struct Node *node);
diff --git a/src/test/regress/expected/horology.out b/src/test/regress/expected/horology.out

index cb28dfbaee71631af397450513e26a92a18a37d0..b90bfcd794f450fdb94c518f16ed64244c0cd8b5 100644 (file)
--- a/src/test/regress/expected/horology.out
+++ b/src/test/regress/expected/horology.out
@@ -3332,6 +3332,12 @@ SELECT to_timestamp('2011-12-18 11:38 MSK', 'YYYY-MM-DD HH12:MI TZ');  -- dyntz
   Sat Dec 17 23:38:00 2011 PST
  (1 row)
  
+SELECT to_timestamp('2011-12-18 00:00 LMT', 'YYYY-MM-DD HH24:MI TZ');  -- dyntz
+         to_timestamp         
+------------------------------
+ Sat Dec 17 23:52:58 2011 PST
+(1 row)
+
  SELECT to_timestamp('2011-12-18 11:38ESTFOO24', 'YYYY-MM-DD HH12:MITZFOOSS');
           to_timestamp         
  ------------------------------
diff --git a/src/test/regress/expected/rules.out b/src/test/regress/expected/rules.out

index ff921bbda0094db6f187262432544e9cc6b8751e..856a8349c50536a2c4bd813a5f34516b1fd0bf23 100644 (file)
--- a/src/test/regress/expected/rules.out
+++ b/src/test/regress/expected/rules.out
@@ -2629,10 +2629,19 @@ pg_tables| SELECT n.nspname AS schemaname,
       LEFT JOIN pg_namespace n ON ((n.oid = c.relnamespace)))
       LEFT JOIN pg_tablespace t ON ((t.oid = c.reltablespace)))
    WHERE (c.relkind = ANY (ARRAY['r'::"char", 'p'::"char"]));
-pg_timezone_abbrevs| SELECT abbrev,
-    utc_offset,
-    is_dst
-   FROM pg_timezone_abbrevs() pg_timezone_abbrevs(abbrev, utc_offset, is_dst);
+pg_timezone_abbrevs| SELECT z.abbrev,
+    z.utc_offset,
+    z.is_dst
+   FROM pg_timezone_abbrevs_zone() z(abbrev, utc_offset, is_dst)
+UNION ALL
+ SELECT a.abbrev,
+    a.utc_offset,
+    a.is_dst
+   FROM pg_timezone_abbrevs_abbrevs() a(abbrev, utc_offset, is_dst)
+  WHERE (NOT (EXISTS ( SELECT 1
+           FROM pg_timezone_abbrevs_zone() z2(abbrev, utc_offset, is_dst)
+          WHERE (z2.abbrev = a.abbrev))))
+  ORDER BY 1;
  pg_timezone_names| SELECT name,
      abbrev,
      utc_offset,
diff --git a/src/test/regress/expected/sysviews.out b/src/test/regress/expected/sysviews.out

index 91089ac215f34f599e4906e8fce36aa1043bbb9a..352abc0bd424ec445f52c2450d9a4b80ac0b61c1 100644 (file)
--- a/src/test/regress/expected/sysviews.out
+++ b/src/test/regress/expected/sysviews.out
@@ -223,3 +223,11 @@ select count(distinct utc_offset) >= 24 as ok from pg_timezone_abbrevs;
   t
  (1 row)
  
+-- One specific case we can check without much fear of breakage
+-- is the historical local-mean-time value used for America/Los_Angeles.
+select * from pg_timezone_abbrevs where abbrev = 'LMT';
+ abbrev |          utc_offset           | is_dst 
+--------+-------------------------------+--------
+ LMT    | @ 7 hours 52 mins 58 secs ago | f
+(1 row)
+
diff --git a/src/test/regress/expected/timestamptz.out b/src/test/regress/expected/timestamptz.out

index a6dd45626ce6f1bfc6649efaa3cb4282a06cd86c..36349e363f292bfac41ef9953ec949f18c1a3496 100644 (file)
--- a/src/test/regress/expected/timestamptz.out
+++ b/src/test/regress/expected/timestamptz.out
@@ -176,6 +176,65 @@ SELECT '205000-01-10 17:32:01 Europe/Helsinki'::timestamptz; -- non-DST
   Fri Jan 10 07:32:01 205000 PST
  (1 row)
  
+-- Recognize "LMT" as whatever it means in the current zone
+SELECT 'Jan 01 00:00:00 1000 LMT'::timestamptz;
+         timestamptz          
+------------------------------
+ Wed Jan 01 00:00:00 1000 LMT
+(1 row)
+
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;
+         timestamptz          
+------------------------------
+ Sun Dec 31 23:52:58 2023 PST
+(1 row)
+
+SET timezone = 'Europe/London';
+SELECT 'Jan 01 00:00:00 1000 LMT'::timestamptz;
+         timestamptz          
+------------------------------
+ Wed Jan 01 00:00:00 1000 LMT
+(1 row)
+
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;
+         timestamptz          
+------------------------------
+ Mon Jan 01 00:01:15 2024 GMT
+(1 row)
+
+-- which might be nothing
+SET timezone = 'UTC';
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;  -- fail
+ERROR:  invalid input syntax for type timestamp with time zone: "Jan 01 00:00:00 2024 LMT"
+LINE 1: SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;
+               ^
+-- Another example of an abbrev that varies across zones
+SELECT '1912-01-01 00:00 MMT'::timestamptz;  -- from timezone_abbreviations
+         timestamptz          
+------------------------------
+ Sun Dec 31 17:30:00 1911 UTC
+(1 row)
+
+SET timezone = 'America/Montevideo';
+SELECT '1912-01-01 00:00'::timestamptz;
+         timestamptz          
+------------------------------
+ Mon Jan 01 00:00:00 1912 MMT
+(1 row)
+
+SELECT '1912-01-01 00:00 MMT'::timestamptz;
+         timestamptz          
+------------------------------
+ Mon Jan 01 00:00:00 1912 MMT
+(1 row)
+
+SELECT '1912-01-01 00:00 MMT'::timestamptz AT TIME ZONE 'UTC';
+         timezone         
+--------------------------
+ Mon Jan 01 03:44:51 1912
+(1 row)
+
+RESET timezone;
  -- Test non-error-throwing API
  SELECT pg_input_is_valid('now', 'timestamptz');
   pg_input_is_valid 
diff --git a/src/test/regress/sql/horology.sql b/src/test/regress/sql/horology.sql

index 4aa88b4ba9a823e4eea26a5446ea772fac8910c5..1310b43277380649299ee6df87378f71ba2d89bf 100644 (file)
--- a/src/test/regress/sql/horology.sql
+++ b/src/test/regress/sql/horology.sql
@@ -538,6 +538,7 @@ SELECT to_timestamp('2011-12-18 11:38 EST', 'YYYY-MM-DD HH12:MI TZ');
  SELECT to_timestamp('2011-12-18 11:38 -05', 'YYYY-MM-DD HH12:MI TZ');
  SELECT to_timestamp('2011-12-18 11:38 +01:30', 'YYYY-MM-DD HH12:MI TZ');
  SELECT to_timestamp('2011-12-18 11:38 MSK', 'YYYY-MM-DD HH12:MI TZ');  -- dyntz
+SELECT to_timestamp('2011-12-18 00:00 LMT', 'YYYY-MM-DD HH24:MI TZ');  -- dyntz
  SELECT to_timestamp('2011-12-18 11:38ESTFOO24', 'YYYY-MM-DD HH12:MITZFOOSS');
  SELECT to_timestamp('2011-12-18 11:38-05FOO24', 'YYYY-MM-DD HH12:MITZFOOSS');
  SELECT to_timestamp('2011-12-18 11:38 JUNK', 'YYYY-MM-DD HH12:MI TZ');  -- error
diff --git a/src/test/regress/sql/sysviews.sql b/src/test/regress/sql/sysviews.sql

index b2a79237543ac359690ebe4c18479c0d548445db..66179f026b379d56f71084ae02c3d5ad7322da1e 100644 (file)
--- a/src/test/regress/sql/sysviews.sql
+++ b/src/test/regress/sql/sysviews.sql
@@ -98,3 +98,6 @@ set timezone_abbreviations = 'Australia';
  select count(distinct utc_offset) >= 24 as ok from pg_timezone_abbrevs;
  set timezone_abbreviations = 'India';
  select count(distinct utc_offset) >= 24 as ok from pg_timezone_abbrevs;
+-- One specific case we can check without much fear of breakage
+-- is the historical local-mean-time value used for America/Los_Angeles.
+select * from pg_timezone_abbrevs where abbrev = 'LMT';
diff --git a/src/test/regress/sql/timestamptz.sql b/src/test/regress/sql/timestamptz.sql

index a92586c363e20b94432ca9a17f10fb5623dea074..2fa5378a572b58123870227af22ff47dc3047a24 100644 (file)
--- a/src/test/regress/sql/timestamptz.sql
+++ b/src/test/regress/sql/timestamptz.sql
@@ -109,6 +109,23 @@ SELECT '20500110 173201 Europe/Helsinki'::timestamptz; -- non-DST
  SELECT '205000-07-10 17:32:01 Europe/Helsinki'::timestamptz; -- DST
  SELECT '205000-01-10 17:32:01 Europe/Helsinki'::timestamptz; -- non-DST
  
+-- Recognize "LMT" as whatever it means in the current zone
+SELECT 'Jan 01 00:00:00 1000 LMT'::timestamptz;
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;
+SET timezone = 'Europe/London';
+SELECT 'Jan 01 00:00:00 1000 LMT'::timestamptz;
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;
+-- which might be nothing
+SET timezone = 'UTC';
+SELECT 'Jan 01 00:00:00 2024 LMT'::timestamptz;  -- fail
+-- Another example of an abbrev that varies across zones
+SELECT '1912-01-01 00:00 MMT'::timestamptz;  -- from timezone_abbreviations
+SET timezone = 'America/Montevideo';
+SELECT '1912-01-01 00:00'::timestamptz;
+SELECT '1912-01-01 00:00 MMT'::timestamptz;
+SELECT '1912-01-01 00:00 MMT'::timestamptz AT TIME ZONE 'UTC';
+RESET timezone;
+
  -- Test non-error-throwing API
  SELECT pg_input_is_valid('now', 'timestamptz');
  SELECT pg_input_is_valid('garbage', 'timestamptz');
diff --git a/src/timezone/localtime.c b/src/timezone/localtime.c

index 21516c65082ed84571c3c5458417261f0223fbc1..8eb02ef14691cb3b06161f1ea6415d33c3b5d4e8 100644 (file)
--- a/src/timezone/localtime.c
+++ b/src/timezone/localtime.c
@@ -1843,6 +1843,120 @@ pg_interpret_timezone_abbrev(const char *abbrev,
     return false;               /* hm, not actually used in any interval? */
  }
  
+/*
+ * Detect whether a timezone abbreviation is defined within the given zone.
+ *
+ * This is similar to pg_interpret_timezone_abbrev() but is not concerned
+ * with a specific point in time.  We want to know if the abbreviation is
+ * known at all, and if so whether it has one meaning or several.
+ *
+ * Returns false, leaving the outputs untouched, if the abbreviation is not
+ * used in the zone.  Otherwise returns true; then if the abbreviation has a
+ * single meaning (one gmtoff and isdst value), *isfixed is set true and
+ * *gmtoff and *isdst are filled, else *isfixed is set false.
+ *
+ * Note: abbrev is matched case-sensitively; it should be all-upper-case.
+ */
+bool
+pg_timezone_abbrev_is_known(const char *abbrev,
+                           bool *isfixed,
+                           long int *gmtoff,
+                           int *isdst,
+                           const pg_tz *tz)
+{
+   bool        result = false;
+   const struct state *sp = &tz->state;
+   const char *abbrs;
+   int         abbrind;
+
+   /*
+    * Locate the abbreviation in the zone's abbreviation list.  We assume
+    * there are not duplicates in the list.
+    */
+   abbrs = sp->chars;
+   abbrind = 0;
+   while (abbrind < sp->charcnt)
+   {
+       if (strcmp(abbrev, abbrs + abbrind) == 0)
+           break;
+       while (abbrs[abbrind] != '\0')
+           abbrind++;
+       abbrind++;
+   }
+   if (abbrind >= sp->charcnt)
+       return false;           /* definitely not there */
+
+   /*
+    * Scan the ttinfo array to find uses of the abbreviation.
+    */
+   for (int i = 0; i < sp->typecnt; i++)
+   {
+       const struct ttinfo *ttisp = &sp->ttis[i];
+
+       if (ttisp->tt_desigidx == abbrind)
+       {
+           if (!result)
+           {
+               /* First usage */
+               *isfixed = true;    /* for the moment */
+               *gmtoff = ttisp->tt_utoff;
+               *isdst = ttisp->tt_isdst;
+               result = true;
+           }
+           else
+           {
+               /* Second or later usage, does it match? */
+               if (*gmtoff != ttisp->tt_utoff ||
+                   *isdst != ttisp->tt_isdst)
+               {
+                   *isfixed = false;
+                   break;      /* no point in looking further */
+               }
+           }
+       }
+   }
+
+   return result;
+}
+
+/*
+ * Iteratively fetch all the abbreviations used in the given time zone.
+ *
+ * *indx is a state counter that the caller must initialize to zero
+ * before the first call, and not touch between calls.
+ *
+ * Returns the next abbreviation (a pointer into *tz, not a copy), or NULL.
+ *
+ * Note: the caller typically applies pg_interpret_timezone_abbrev()
+ * to each result.  While that nominally results in O(N^2) time spent
+ * searching the sp->chars[] array, we don't expect any zone to have
+ * enough abbreviations to make that meaningful.
+ */
+const char *
+pg_get_next_timezone_abbrev(int *indx,
+                           const pg_tz *tz)
+{
+   const char *result;
+   const struct state *sp = &tz->state;
+   const char *abbrs;
+   int         abbrind;
+
+   /* If we're still in range, the result is the current abbrev. */
+   abbrs = sp->chars;
+   abbrind = *indx;
+   if (abbrind < 0 || abbrind >= sp->charcnt)
+       return NULL;
+   result = abbrs + abbrind;
+
+   /* Advance *indx past this abbrev and its trailing null. */
+   while (abbrs[abbrind] != '\0')
+       abbrind++;
+   abbrind++;
+   *indx = abbrind;
+
+   return result;
+}
+
  /*
   * If the given timezone uses only one GMT offset, store that offset
   * into *gmtoff and return true, else return false.
diff --git a/src/tools/pgindent/typedefs.list b/src/tools/pgindent/typedefs.list

index 56ba63f3d923b7ee7648a762d72830029d422ff1..ebba5b7c9537c1b5a876553847296c4930f7c24b 100644 (file)
--- a/src/tools/pgindent/typedefs.list
+++ b/src/tools/pgindent/typedefs.list
@@ -3036,6 +3036,7 @@ TypeCat
  TypeFuncClass
  TypeInfo
  TypeName
+TzAbbrevCache
  U32
  U8
  UChar
author	Tom Lane <tgl@sss.pgh.pa.us>
	Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)
committer	Tom Lane <tgl@sss.pgh.pa.us>
	Thu, 16 Jan 2025 19:11:19 +0000 (14:11 -0500)
doc/src/sgml/config.sgml		patch \| blob \| blame \| history
doc/src/sgml/datatype.sgml		patch \| blob \| blame \| history
doc/src/sgml/datetime.sgml		patch \| blob \| blame \| history
doc/src/sgml/system-views.sgml		patch \| blob \| blame \| history
src/backend/catalog/system_views.sql		patch \| blob \| blame \| history
src/backend/commands/variable.c		patch \| blob \| blame \| history
src/backend/utils/adt/datetime.c		patch \| blob \| blame \| history
src/include/catalog/catversion.h		patch \| blob \| blame \| history
src/include/catalog/pg_proc.dat		patch \| blob \| blame \| history
src/include/pgtime.h		patch \| blob \| blame \| history
src/include/utils/datetime.h		patch \| blob \| blame \| history
src/test/regress/expected/horology.out		patch \| blob \| blame \| history
src/test/regress/expected/rules.out		patch \| blob \| blame \| history
src/test/regress/expected/sysviews.out		patch \| blob \| blame \| history
src/test/regress/expected/timestamptz.out		patch \| blob \| blame \| history
src/test/regress/sql/horology.sql		patch \| blob \| blame \| history
src/test/regress/sql/sysviews.sql		patch \| blob \| blame \| history
src/test/regress/sql/timestamptz.sql		patch \| blob \| blame \| history
src/timezone/localtime.c		patch \| blob \| blame \| history
src/tools/pgindent/typedefs.list		patch \| blob \| blame \| history