proxy/logging/LogUtils.cc - trafficserver - Git at Google

 /** @file

  This file contains a set of utility routines that are used throughout the
  logging implementation.

   @section license License

   Licensed to the Apache Software Foundation (ASF) under one
   or more contributor license agreements.  See the NOTICE file
   distributed with this work for additional information
   regarding copyright ownership.  The ASF licenses this file
   to you under the Apache License, Version 2.0 (the
   "License"); you may not use this file except in compliance
   with the License.  You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.
  */

 #include <tscore/ink_align.h>
 #include "tscore/ink_config.h"
 #include "tscore/ink_string.h"
 #include <tscore/ink_assert.h>
 #include <tscore/BufferWriter.h>

 #ifdef TEST_LOG_UTILS

 #include "unit-tests/test_LogUtils.h"

 #else

 #include <MIME.h>

 #endif

 #include <cassert>
 #include <cstdio>
 #include <cstdlib>
 #include <cstdarg>
 #include <cstring>
 #include <ctime>
 #include <string_view>
 #include <cstdint>

 #include <sys/time.h>
 #include <sys/types.h>
 #include <sys/stat.h>
 #include <unistd.h>
 #include <sys/socket.h>
 #include <netinet/in.h>
 #include <arpa/inet.h>
 #include <netdb.h>

 #include "records/P_RecProcess.h"
 // REC_SIGNAL_LOGGING_ERROR    is defined in I_RecSignals.h
 // REC_SIGNAL_LOGGING_WARNING  is defined in I_RecSignals.h

 #include "LogUtils.h"
 #include "LogLimits.h"

 /*-------------------------------------------------------------------------
   LogUtils::timestamp_to_str

   This routine will convert a timestamp (seconds) into a short string,
   of the format "%Y%m%d.%Hh%Mm%Ss".

   Since the resulting buffer is passed in, this routine is thread-safe.
   Return value is the number of characters placed into the array, not
   including the NULL.
   -------------------------------------------------------------------------*/

 int
 LogUtils::timestamp_to_str(long timestamp, char *buf, int size)
 {
   static const char *format_str = "%Y%m%d.%Hh%Mm%Ss";
   struct tm res;
   struct tm *tms;
   tms = ink_localtime_r((const time_t *)&timestamp, &res);
   return strftime(buf, size, format_str, tms);
 }

 /*-------------------------------------------------------------------------
   LogUtils::timestamp_to_netscape_str

   This routine will convert a timestamp (seconds) into a string compatible
   with the Netscape logging formats.

   This routine is intended to be called from the (single) logging thread,
   and is therefore NOT MULTITHREADED SAFE.  There is a single, static,
   string buffer that the time string is constructed into and returned.
   -------------------------------------------------------------------------*/

 char *
 LogUtils::timestamp_to_netscape_str(long timestamp)
 {
   static char timebuf[64]; // NOTE: not MT safe
   static long last_timestamp = 0;

   // safety check
   if (timestamp < 0) {
     static char bad_time[] = "Bad timestamp";
     return bad_time;
   }
   //
   // since we may have many entries per second, lets only do the
   // formatting if we actually have a new timestamp.
   //

   if (timestamp != last_timestamp) {
     //
     // most of this garbage is simply to find out the offset from GMT,
     // taking daylight savings into account.
     //
     struct tm res;
     struct tm *tms = ink_localtime_r((const time_t *)&timestamp, &res);
 #if defined(solaris)
     long zone = (tms->tm_isdst > 0) ? altzone : timezone;
 #else
     long zone = -tms->tm_gmtoff; // double negative!
 #endif
     int offset;
     char sign;

     if (zone >= 0) {
       offset = zone / 60;
       sign   = '-';
     } else {
       offset = zone / -60;
       sign   = '+';
     }

     static char gmtstr[16];
     int glen = snprintf(gmtstr, 16, "%c%.2d%.2d", sign, offset / 60, offset % 60);

     strftime(timebuf, 64 - glen, "%d/%b/%Y:%H:%M:%S ", tms);
     ink_strlcat(timebuf, gmtstr, sizeof(timebuf));
     last_timestamp = timestamp;
   }
   return timebuf;
 }

 /*-------------------------------------------------------------------------
   LogUtils::timestamp_to_date_str

   This routine will convert a timestamp (seconds) into a W3C compatible
   date string.
   -------------------------------------------------------------------------*/

 char *
 LogUtils::timestamp_to_date_str(long timestamp)
 {
   static char timebuf[64]; // NOTE: not MT safe
   static long last_timestamp = 0;

   // safety check
   if (timestamp < 0) {
     static char bad_time[] = "Bad timestamp";
     return bad_time;
   }
   //
   // since we may have many entries per second, lets only do the
   // formatting if we actually have a new timestamp.
   //

   if (timestamp != last_timestamp) {
     struct tm res;
     struct tm *tms = ink_localtime_r((const time_t *)&timestamp, &res);
     strftime(timebuf, 64, "%Y-%m-%d", tms);
     last_timestamp = timestamp;
   }
   return timebuf;
 }

 /*-------------------------------------------------------------------------
   LogUtils::timestamp_to_time_str

   This routine will convert a timestamp (seconds) into a W3C compatible
   time string.
   -------------------------------------------------------------------------*/

 char *
 LogUtils::timestamp_to_time_str(long timestamp)
 {
   static char timebuf[64]; // NOTE: not MT safe
   static long last_timestamp = 0;

   // safety check
   if (timestamp < 0) {
     static char bad_time[] = "Bad timestamp";
     return bad_time;
   }
   //
   // since we may have many entries per second, lets only do the
   // formatting if we actually have a new timestamp.
   //

   if (timestamp != last_timestamp) {
     struct tm res;
     struct tm *tms = ink_localtime_r((const time_t *)&timestamp, &res);
     strftime(timebuf, 64, "%H:%M:%S", tms);
     last_timestamp = timestamp;
   }
   return timebuf;
 }

 /*-------------------------------------------------------------------------
   LogUtils::manager_alarm

   This routine provides a convenient abstraction for sending the traffic
   server manager process an alarm.  The logging system can send
   LOG_ALARM_N_TYPES different types of alarms, as defined in LogUtils.h.
   Subsequent alarms of the same type will override the previous alarm
   entry.
   -------------------------------------------------------------------------*/

 void
 LogUtils::manager_alarm(LogUtils::AlarmType alarm_type, const char *msg, ...)
 {
   char msg_buf[LOG_MAX_FORMATTED_LINE];

   ink_assert(alarm_type >= 0 && alarm_type < LogUtils::LOG_ALARM_N_TYPES);

   if (msg == nullptr) {
     snprintf(msg_buf, sizeof(msg_buf), "No Message");
   } else {
     va_list ap;
     va_start(ap, msg);
     vsnprintf(msg_buf, LOG_MAX_FORMATTED_LINE, msg, ap);
     va_end(ap);
   }

   switch (alarm_type) {
   case LogUtils::LOG_ALARM_ERROR:
     RecSignalManager(REC_SIGNAL_LOGGING_ERROR, msg_buf);
     break;

   case LogUtils::LOG_ALARM_WARNING:
     RecSignalManager(REC_SIGNAL_LOGGING_WARNING, msg_buf);
     break;

   default:
     ink_assert(false);
   }
 }

 /*-------------------------------------------------------------------------
   LogUtils::strip_trailing_newline

   This routine examines the given string buffer to see if the last
   character before the trailing NULL is a newline ('\n').  If so, it will
   be replaced with a NULL, thus stripping it and reducing the length of
   the string by one.
   -------------------------------------------------------------------------*/

 void
 LogUtils::strip_trailing_newline(char *buf)
 {
   if (buf != nullptr) {
     int len = ::strlen(buf);
     if (len > 0) {
       if (buf[len - 1] == '\n') {
         buf[len - 1] = '\0';
       }
     }
   }
 }

 /*-------------------------------------------------------------------------
   LogUtils::escapify_url_common

   This routine will escapify a URL to remove spaces (and perhaps other ugly
   characters) from a URL and replace them with a hex escape sequence.
   Since the escapes are larger (multi-byte) than the characters being
   replaced, the string returned will be longer than the string passed.

   This is a worker function called by escapify_url and pure_escapify_url.  These
   functions differ on whether the function tries to detect and avoid
   double URL encoding (escapify_url) or not (pure_escapify_url)
   -------------------------------------------------------------------------*/

 namespace
 {
 char *
 escapify_url_common(Arena *arena, char *url, size_t len_in, int *len_out, char *dst, size_t dst_size, const unsigned char *map,
                     bool pure_escape)
 {
   // codes_to_escape is a bitmap encoding the codes that should be escaped.
   // These are all the codes defined in section 2.4.3 of RFC 2396
   // (control, space, delims, and unwise) plus the tilde. In RFC 2396
   // the tilde is an "unreserved" character, but we escape it because
   // historically this is what the traffic_server has done.
   // Note that we leave codes beyond 127 unmodified.
   //
   static const unsigned char codes_to_escape[32] = {
     0xFF, 0xFF, 0xFF,
     0xFF,             // control
     0xB4,             // space " # %
     0x00, 0x00,       //
     0x0A,             // < >
     0x00, 0x00, 0x00, //
     0x1E, 0x80,       // [ \ ] ^ `
     0x00, 0x00,       //
     0x1F,             // { | } ~ DEL
     0x00, 0x00, 0x00,
     0x00, // all non-ascii characters unmodified
     0x00, 0x00, 0x00,
     0x00, //               .
     0x00, 0x00, 0x00,
     0x00, //               .
     0x00, 0x00, 0x00,
     0x00 //               .
   };

   static char hex_digit[16] = {'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F'};

   if (!url || (dst && dst_size < len_in)) {
     *len_out = 0;
     return nullptr;
   }

   if (!map) {
     map = codes_to_escape;
   }

   // Count specials in the url, assuming that there won't be any.
   //
   int count        = 0;
   char *p          = url;
   char *in_url_end = url + len_in;

   while (p < in_url_end) {
     unsigned char c = *p;
     if (map[c / 8] & (1 << (7 - c % 8))) {
       ++count;
     }
     ++p;
   }

   if (!count) {
     // The common case, no escapes, so just return the source string.
     //
     *len_out = len_in;
     if (dst) {
       ink_strlcpy(dst, url, dst_size);
     }
     return url;
   }

   // For each special char found, we'll need an escape string, which is
   // three characters long.  Count this and allocate the string required.
   //
   // make sure we take into account the characters we are substituting
   // for when we calculate out_len !!! in other words,
   // out_len = len_in + 3*count - count
   //
   size_t out_len = len_in + 2 * count;

   if (dst && out_len > dst_size) {
     *len_out = 0;
     return nullptr;
   }

   // To play it safe, we null terminate the string we return in case
   // a module that expects null-terminated strings calls escapify_url,
   // so we allocate an extra byte for the EOS
   //
   char *new_url;

   if (dst) {
     new_url = dst;
   } else {
     new_url = arena->str_alloc(out_len + 1);
   }

   char *from = url;
   char *to   = new_url;

   while (from < in_url_end) {
     unsigned char c = *from;
     if (map[c / 8] & (1 << (7 - c % 8))) {
       /*
        * If two characters following a '%' don't need to be encoded, then it must
        * mean that the three character sequence is already encoded.  Just copy it over.
        */
       if (!pure_escape && (*from == '%') && ((from + 2) < in_url_end)) {
         unsigned char c1   = *(from + 1);
         unsigned char c2   = *(from + 2);
         bool needsEncoding = ((map[c1 / 8] & (1 << (7 - c1 % 8))) || (map[c2 / 8] & (1 << (7 - c2 % 8))));
         if (!needsEncoding) {
           out_len -= 2;
           Debug("log-utils", "character already encoded..skipping %c, %c, %c", *from, *(from + 1), *(from + 2));
           *to++ = *from++;
           continue;
         }
       }

       *to++ = '%';
       *to++ = hex_digit[c / 16];
       *to++ = hex_digit[c % 16];
     } else {
       *to++ = *from;
     }
     from++;
   }
   *to = '\0'; // null terminate string

   *len_out = out_len;
   return new_url;
 }
 } // namespace

 char *
 LogUtils::escapify_url(Arena *arena, char *url, size_t len_in, int *len_out, char *dst, size_t dst_size, const unsigned char *map)
 {
   return escapify_url_common(arena, url, len_in, len_out, dst, dst_size, map, false);
 }

 char *
 LogUtils::pure_escapify_url(Arena *arena, char *url, size_t len_in, int *len_out, char *dst, size_t dst_size,
                             const unsigned char *map)
 {
   return escapify_url_common(arena, url, len_in, len_out, dst, dst_size, map, true);
 }

 /*-------------------------------------------------------------------------
   LogUtils::remove_content_type_attributes

   HTTP allows content types to have attributes following the main type and
   subtype.  For example, attributes of text/html might be charset=iso-8859.
   The content type attributes are not logged, so this function strips them
   from the given buffer, if present.
   -------------------------------------------------------------------------*/

 void
 LogUtils::remove_content_type_attributes(char *type_str, int *type_len)
 {
   if (!type_str) {
     *type_len = 0;
     return;
   }
   // Look for a semicolon and cut out everything after that
   //
   char *p = static_cast<char *>(memchr(type_str, ';', *type_len));
   if (p) {
     *type_len = p - type_str;
   }
 }

 /*
 int
 LogUtils::ip_to_str (unsigned ip, char *str, unsigned len)
 {
     int ret = snprintf (str, len, "%u.%u.%u.%u",
                             (ip >> 24) & 0xff,
                             (ip >> 16) & 0xff,
                             (ip >> 8)  & 0xff,
                             ip         & 0xff);

     return ((ret <= (int)len)? ret : (int)len);
 }
 */

 // return the seconds remaining until the time of the next roll given
 // the current time, the rolling offset, and the rolling interval
 //
 int
 LogUtils::seconds_to_next_roll(time_t time_now, int rolling_offset, int rolling_interval)
 {
   struct tm lt;
   ink_localtime_r((const time_t *)&time_now, &lt);
   int sidl = lt.tm_sec + lt.tm_min * 60 + lt.tm_hour * 3600;
   int tr   = rolling_offset * 3600;
   return ((tr >= sidl ? (tr - sidl) % rolling_interval : (86400 - (sidl - tr)) % rolling_interval));
 }

 ts::TextView
 LogUtils::get_unrolled_filename(ts::TextView rolled_filename)
 {
   auto unrolled_name = rolled_filename;

   // A rolled log will look something like:
   //   squid.log_some.hostname.com.20191029.18h15m02s-20191029.18h30m02s.old
   auto suffix = rolled_filename;

   suffix.remove_prefix_at('.');
   // Using the above squid.log example, suffix now looks like:
   //   log_some.hostname.com.20191029.18h15m02s-20191029.18h30m02s.old

   // Some suffixes do not have the hostname.  Rolled diags.log files will look
   // something like this, for example:
   //   diags.log.20191114.21h43m16s-20191114.21h43m17s.old
   //
   // For these, the second delimeter will be a period. For this reason, we also
   // split_prefix_at with a period as well.
   if (suffix.split_prefix_at('_') || suffix.split_prefix_at('.')) {
     // ' + 1' to remove the '_' or second '.':
     return unrolled_name.remove_suffix(suffix.size() + 1);
   }
   // If there isn't a '.' or an '_' after the first '.', then this
   // doesn't look like a rolled file.
   return rolled_filename;
 }

 // Checks if the file pointed to by full_filename either is a regular
 // file or a pipe and has write permission, or, if the file does not
 // exist, if the path prefix of full_filename names a directory that
 // has both execute and write permissions, so there will be no problem
 // creating the file. If the size_bytes pointer is not NULL, it returns
 // the size of the file through it.
 // Also checks the current size limit for the file. If there is a
 // limit and has_size_limit is not null, *has_size_limit is set to
 // true. If there is no limit and has_size_limit is not null,
 // *has_size_limit is set to false.  If there is a limit and if the
 // current_size_limit_bytes pointer is not null, it returns the limit
 // through it.
 //
 // returns:
 //  0 on success
 // -1 on system error (no permission, etc.)
 //  1 if the file full_filename points to is neither a regular file
 //    nor a pipe
 //
 int
 LogUtils::file_is_writeable(const char *full_filename, off_t *size_bytes, bool *has_size_limit, uint64_t *current_size_limit_bytes)
 {
   int ret_val = 0;
   int e;
   struct stat stat_data;

   e = stat(full_filename, &stat_data);
   if (e == 0) {
     // stat succeeded, check if full_filename points to a regular
     // file/fifo and if so, check if file has write permission
     //
     if (!(S_ISREG(stat_data.st_mode) || S_ISFIFO(stat_data.st_mode))) {
       ret_val = 1;
     } else if (!(stat_data.st_mode & S_IWUSR)) {
       errno   = EACCES;
       ret_val = -1;
     }
     if (size_bytes) {
       *size_bytes = stat_data.st_size;
     }
   } else {
     // stat failed
     //
     if (errno != ENOENT) {
       // can't stat file
       //
       ret_val = -1;
     } else {
       // file does not exist, check that the prefix is a directory with
       // write and execute permissions

       char *dir;
       char *prefix = nullptr;

       // search for forward or reverse slash in full_filename
       // starting from the end
       //
       const char *slash = strrchr(full_filename, '/');
       if (slash) {
         size_t prefix_len = slash - full_filename + 1;
         prefix            = new char[prefix_len + 1];
         memcpy(prefix, full_filename, prefix_len);
         prefix[prefix_len] = 0;
         dir                = prefix;
       } else {
         dir = (char *)"."; // full_filename has no prefix, use .
       }

       // check if directory is executable and writeable
       //
       e = access(dir, X_OK | W_OK);
       if (e < 0) {
         ret_val = -1;
       } else {
         if (size_bytes) {
           *size_bytes = 0;
         }
       }

       if (prefix) {
         delete[] prefix;
       }
     }
   }

   // check for the current filesize limit
   //
   if (ret_val == 0) {
     struct rlimit limit_data;
     e = getrlimit(RLIMIT_FSIZE, &limit_data);
     if (e < 0) {
       ret_val = -1;
     } else {
       if (limit_data.rlim_cur != static_cast<rlim_t> RLIM_INFINITY) {
         if (has_size_limit) {
           *has_size_limit = true;
         }
         if (current_size_limit_bytes) {
           *current_size_limit_bytes = limit_data.rlim_cur;
         }
       } else {
         if (has_size_limit) {
           *has_size_limit = false;
         }
       }
     }
   }

   return ret_val;
 }

 namespace
 {
 // Get a string out of a MIMEField using one of its member functions, and put it into a buffer writer, terminated with a nul.
 //
 void
 marshalStr(ts::FixedBufferWriter &bw, const MIMEField &mf, const char *(MIMEField::*get_func)(int *length) const)
 {
   int length;
   const char *data = (mf.*get_func)(&length);

   if (!data or (*data == '\0')) {
     // Empty string.  This is a problem, since it would result in two successive nul characters, which indicates the end of the
     // marshaled hearer.  Change the string to a single blank character.

     static const char Blank[] = " ";
     data                      = Blank;
     length                    = 1;
   }

   bw << std::string_view(data, length) << '\0';
 }

 void
 unmarshalStr(ts::FixedBufferWriter &bw, const char *&data)
 {
   bw << '{';

   while (*data) {
     bw << *(data++);
   }

   // Skip over terminal nul.
   ++data;

   bw << '}';
 }

 } // end anonymous namespace

 namespace LogUtils
 {
 // Marshals header tags and values together, with a single terminating nul character.  Returns buffer space required.  'buf' points
 // to where to put the marshaled data.  If 'buf' is null, no data is marshaled, but the function returns the amount of space that
 // would have been used.
 //
 int
 marshalMimeHdr(MIMEHdr *hdr, char *buf)
 {
   std::size_t bwSize = buf ? SIZE_MAX : 0;

   ts::FixedBufferWriter bw(buf, bwSize);

   if (hdr) {
     MIMEFieldIter mfIter;
     const MIMEField *mfp = hdr->iter_get_first(&mfIter);

     while (mfp) {
       marshalStr(bw, *mfp, &MIMEField::name_get);
       marshalStr(bw, *mfp, &MIMEField::value_get);

       mfp = hdr->iter_get_next(&mfIter);
     }
   }

   bw << '\0';

   return int(INK_ALIGN_DEFAULT(bw.extent()));
 }

 // Unmarshaled/printable format is {{{tag1}:{value1}}{{tag2}:{value2}} ... }
 //
 int
 unmarshalMimeHdr(char **buf, char *dest, int destLength)
 {
   ink_assert(*buf != nullptr);

   const char *data = *buf;

   ink_assert(data != nullptr);

   ts::FixedBufferWriter bw(dest, destLength);

   bw << '{';

   int pairEndFallback{0}, pairEndFallback2{0}, pairSeparatorFallback{0};

   while (*data) {
     if (!bw.error()) {
       pairEndFallback2 = pairEndFallback;
       pairEndFallback  = bw.size();
     }

     // Add open bracket of pair.
     //
     bw << '{';

     // Unmarshal field name.
     unmarshalStr(bw, data);

     bw << ':';

     if (!bw.error()) {
       pairSeparatorFallback = bw.size();
     }

     // Unmarshal field value.
     unmarshalStr(bw, data);

     // Add close bracket of pair.
     bw << '}';

   } // end for loop

   bw << '}';

   if (bw.error()) {
     // The output buffer wasn't big enough.

     static std::string_view FULL_ELLIPSES("...}}}");

     if ((pairSeparatorFallback > pairEndFallback) and ((pairSeparatorFallback + 7) <= destLength)) {
       // In the report, we can show the existence of the last partial tag/value pair, and maybe part of the value.  If we only
       // show part of the value, we want to end it with an elipsis, to make it clear it's not complete.

       bw.reduce(destLength - FULL_ELLIPSES.size());
       bw << FULL_ELLIPSES;

     } else if (pairEndFallback and (pairEndFallback < destLength)) {
       bw.reduce(pairEndFallback);
       bw << '}';

     } else if ((pairSeparatorFallback > pairEndFallback2) and ((pairSeparatorFallback + 7) <= destLength)) {
       bw.reduce(destLength - FULL_ELLIPSES.size());
       bw << FULL_ELLIPSES;

     } else if (pairEndFallback2 and (pairEndFallback2 < destLength)) {
       bw.reduce(pairEndFallback2);
       bw << '}';

     } else if (destLength > 1) {
       bw.reduce(1);
       bw << '}';

     } else {
       bw.reduce(0);
     }
   }

   *buf += INK_ALIGN_DEFAULT(data - *buf + 1);

   return bw.size();
 }

 } // end namespace LogUtils
	/** @file

	This file contains a set of utility routines that are used throughout the
	logging implementation.

	@section license License

	Licensed to the Apache Software Foundation (ASF) under one
	or more contributor license agreements. See the NOTICE file
	distributed with this work for additional information
	regarding copyright ownership. The ASF licenses this file
	to you under the Apache License, Version 2.0 (the
	"License"); you may not use this file except in compliance
	with the License. You may obtain a copy of the License at

	http://www.apache.org/licenses/LICENSE-2.0

	Unless required by applicable law or agreed to in writing, software
	distributed under the License is distributed on an "AS IS" BASIS,
	WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	See the License for the specific language governing permissions and
	limitations under the License.
	*/

	#include <tscore/ink_align.h>
	#include "tscore/ink_config.h"
	#include "tscore/ink_string.h"
	#include <tscore/ink_assert.h>
	#include <tscore/BufferWriter.h>

	#ifdef TEST_LOG_UTILS

	#include "unit-tests/test_LogUtils.h"

	#else

	#include <MIME.h>

	#endif

	#include <cassert>
	#include <cstdio>
	#include <cstdlib>
	#include <cstdarg>
	#include <cstring>
	#include <ctime>
	#include <string_view>
	#include <cstdint>

	#include <sys/time.h>
	#include <sys/types.h>
	#include <sys/stat.h>
	#include <unistd.h>
	#include <sys/socket.h>
	#include <netinet/in.h>
	#include <arpa/inet.h>
	#include <netdb.h>

	#include "records/P_RecProcess.h"
	// REC_SIGNAL_LOGGING_ERROR is defined in I_RecSignals.h
	// REC_SIGNAL_LOGGING_WARNING is defined in I_RecSignals.h

	#include "LogUtils.h"
	#include "LogLimits.h"

	/*-------------------------------------------------------------------------
	LogUtils::timestamp_to_str

	This routine will convert a timestamp (seconds) into a short string,
	of the format "%Y%m%d.%Hh%Mm%Ss".

	Since the resulting buffer is passed in, this routine is thread-safe.
	Return value is the number of characters placed into the array, not
	including the NULL.
	-------------------------------------------------------------------------*/

	int
	LogUtils::timestamp_to_str(long timestamp, char *buf, int size)
	{
	static const char *format_str = "%Y%m%d.%Hh%Mm%Ss";
	struct tm res;
	struct tm *tms;
	tms = ink_localtime_r((const time_t *)&timestamp, &res);
	return strftime(buf, size, format_str, tms);
	}

	/*-------------------------------------------------------------------------
	LogUtils::timestamp_to_netscape_str

	This routine will convert a timestamp (seconds) into a string compatible
	with the Netscape logging formats.

	This routine is intended to be called from the (single) logging thread,
	and is therefore NOT MULTITHREADED SAFE. There is a single, static,
	string buffer that the time string is constructed into and returned.
	-------------------------------------------------------------------------*/

	char *
	LogUtils::timestamp_to_netscape_str(long timestamp)
	{
	static char timebuf[64]; // NOTE: not MT safe
	static long last_timestamp = 0;

	// safety check
	if (timestamp < 0) {
	static char bad_time[] = "Bad timestamp";
	return bad_time;
	}
	//
	// since we may have many entries per second, lets only do the
	// formatting if we actually have a new timestamp.
	//

	if (timestamp != last_timestamp) {
	//
	// most of this garbage is simply to find out the offset from GMT,
	// taking daylight savings into account.
	//
	struct tm res;
	struct tm tms = ink_localtime_r((const time_t )&timestamp, &res);
	#if defined(solaris)
	long zone = (tms->tm_isdst > 0) ? altzone : timezone;
	#else
	long zone = -tms->tm_gmtoff; // double negative!
	#endif
	int offset;
	char sign;

	if (zone >= 0) {
	offset = zone / 60;
	sign = '-';
	} else {
	offset = zone / -60;
	sign = '+';
	}

	static char gmtstr[16];
	int glen = snprintf(gmtstr, 16, "%c%.2d%.2d", sign, offset / 60, offset % 60);

	strftime(timebuf, 64 - glen, "%d/%b/%Y:%H:%M:%S ", tms);
	ink_strlcat(timebuf, gmtstr, sizeof(timebuf));
	last_timestamp = timestamp;
	}
	return timebuf;
	}

	/*-------------------------------------------------------------------------
	LogUtils::timestamp_to_date_str

	This routine will convert a timestamp (seconds) into a W3C compatible
	date string.
	-------------------------------------------------------------------------*/

	char *
	LogUtils::timestamp_to_date_str(long timestamp)
	{
	static char timebuf[64]; // NOTE: not MT safe
	static long last_timestamp = 0;

	// safety check
	if (timestamp < 0) {
	static char bad_time[] = "Bad timestamp";
	return bad_time;
	}
	//
	// since we may have many entries per second, lets only do the
	// formatting if we actually have a new timestamp.
	//

	if (timestamp != last_timestamp) {
	struct tm res;
	struct tm tms = ink_localtime_r((const time_t )&timestamp, &res);
	strftime(timebuf, 64, "%Y-%m-%d", tms);
	last_timestamp = timestamp;
	}
	return timebuf;
	}

	/*-------------------------------------------------------------------------
	LogUtils::timestamp_to_time_str

	This routine will convert a timestamp (seconds) into a W3C compatible
	time string.
	-------------------------------------------------------------------------*/

	char *
	LogUtils::timestamp_to_time_str(long timestamp)
	{
	static char timebuf[64]; // NOTE: not MT safe
	static long last_timestamp = 0;

	// safety check
	if (timestamp < 0) {
	static char bad_time[] = "Bad timestamp";
	return bad_time;
	}
	//
	// since we may have many entries per second, lets only do the
	// formatting if we actually have a new timestamp.
	//

	if (timestamp != last_timestamp) {
	struct tm res;
	struct tm tms = ink_localtime_r((const time_t )&timestamp, &res);
	strftime(timebuf, 64, "%H:%M:%S", tms);
	last_timestamp = timestamp;
	}
	return timebuf;
	}

	/*-------------------------------------------------------------------------
	LogUtils::manager_alarm

	This routine provides a convenient abstraction for sending the traffic
	server manager process an alarm. The logging system can send
	LOG_ALARM_N_TYPES different types of alarms, as defined in LogUtils.h.
	Subsequent alarms of the same type will override the previous alarm
	entry.
	-------------------------------------------------------------------------*/

	void
	LogUtils::manager_alarm(LogUtils::AlarmType alarm_type, const char *msg, ...)
	{
	char msg_buf[LOG_MAX_FORMATTED_LINE];

	ink_assert(alarm_type >= 0 && alarm_type < LogUtils::LOG_ALARM_N_TYPES);

	if (msg == nullptr) {
	snprintf(msg_buf, sizeof(msg_buf), "No Message");
	} else {
	va_list ap;
	va_start(ap, msg);
	vsnprintf(msg_buf, LOG_MAX_FORMATTED_LINE, msg, ap);
	va_end(ap);
	}

	switch (alarm_type) {
	case LogUtils::LOG_ALARM_ERROR:
	RecSignalManager(REC_SIGNAL_LOGGING_ERROR, msg_buf);
	break;

	case LogUtils::LOG_ALARM_WARNING:
	RecSignalManager(REC_SIGNAL_LOGGING_WARNING, msg_buf);
	break;

	default:
	ink_assert(false);
	}
	}

	/*-------------------------------------------------------------------------
	LogUtils::strip_trailing_newline

	This routine examines the given string buffer to see if the last
	character before the trailing NULL is a newline ('\n'). If so, it will
	be replaced with a NULL, thus stripping it and reducing the length of
	the string by one.
	-------------------------------------------------------------------------*/

	void
	LogUtils::strip_trailing_newline(char *buf)
	{
	if (buf != nullptr) {
	int len = ::strlen(buf);
	if (len > 0) {
	if (buf[len - 1] == '\n') {
	buf[len - 1] = '\0';
	}
	}
	}
	}

	/*-------------------------------------------------------------------------
	LogUtils::escapify_url_common

	This routine will escapify a URL to remove spaces (and perhaps other ugly
	characters) from a URL and replace them with a hex escape sequence.
	Since the escapes are larger (multi-byte) than the characters being
	replaced, the string returned will be longer than the string passed.

	This is a worker function called by escapify_url and pure_escapify_url. These
	functions differ on whether the function tries to detect and avoid
	double URL encoding (escapify_url) or not (pure_escapify_url)
	-------------------------------------------------------------------------*/

	namespace
	{
	char *
	escapify_url_common(Arena arena, char url, size_t len_in, int len_out, char dst, size_t dst_size, const unsigned char *map,
	bool pure_escape)
	{
	// codes_to_escape is a bitmap encoding the codes that should be escaped.
	// These are all the codes defined in section 2.4.3 of RFC 2396
	// (control, space, delims, and unwise) plus the tilde. In RFC 2396
	// the tilde is an "unreserved" character, but we escape it because
	// historically this is what the traffic_server has done.
	// Note that we leave codes beyond 127 unmodified.
	//
	static const unsigned char codes_to_escape[32] = {
	0xFF, 0xFF, 0xFF,
	0xFF, // control
	0xB4, // space " # %
	0x00, 0x00, //
	0x0A, // < >
	0x00, 0x00, 0x00, //
	0x1E, 0x80, // [ \ ] ^ `
	0x00, 0x00, //
	0x1F, // { \| } ~ DEL
	0x00, 0x00, 0x00,
	0x00, // all non-ascii characters unmodified
	0x00, 0x00, 0x00,
	0x00, // .
	0x00, 0x00, 0x00,
	0x00, // .
	0x00, 0x00, 0x00,
	0x00 // .
	};

	static char hex_digit[16] = {'0', '1', '2', '3', '4', '5', '6', '7', '8', '9', 'A', 'B', 'C', 'D', 'E', 'F'};

	if (!url \|\| (dst && dst_size < len_in)) {
	*len_out = 0;
	return nullptr;
	}

	if (!map) {
	map = codes_to_escape;
	}

	// Count specials in the url, assuming that there won't be any.
	//
	int count = 0;
	char *p = url;
	char *in_url_end = url + len_in;

	while (p < in_url_end) {
	unsigned char c = *p;
	if (map[c / 8] & (1 << (7 - c % 8))) {
	++count;
	}
	++p;
	}

	if (!count) {
	// The common case, no escapes, so just return the source string.
	//
	*len_out = len_in;
	if (dst) {
	ink_strlcpy(dst, url, dst_size);
	}
	return url;
	}

	// For each special char found, we'll need an escape string, which is
	// three characters long. Count this and allocate the string required.
	//
	// make sure we take into account the characters we are substituting
	// for when we calculate out_len !!! in other words,
	// out_len = len_in + 3*count - count
	//
	size_t out_len = len_in + 2 * count;

	if (dst && out_len > dst_size) {
	*len_out = 0;
	return nullptr;
	}

	// To play it safe, we null terminate the string we return in case
	// a module that expects null-terminated strings calls escapify_url,
	// so we allocate an extra byte for the EOS
	//
	char *new_url;

	if (dst) {
	new_url = dst;
	} else {
	new_url = arena->str_alloc(out_len + 1);
	}

	char *from = url;
	char *to = new_url;

	while (from < in_url_end) {
	unsigned char c = *from;
	if (map[c / 8] & (1 << (7 - c % 8))) {
	/*
	* If two characters following a '%' don't need to be encoded, then it must
	* mean that the three character sequence is already encoded. Just copy it over.
	*/
	if (!pure_escape && (*from == '%') && ((from + 2) < in_url_end)) {
	unsigned char c1 = *(from + 1);
	unsigned char c2 = *(from + 2);
	bool needsEncoding = ((map[c1 / 8] & (1 << (7 - c1 % 8))) \|\| (map[c2 / 8] & (1 << (7 - c2 % 8))));
	if (!needsEncoding) {
	out_len -= 2;
	Debug("log-utils", "character already encoded..skipping %c, %c, %c", from, (from + 1), *(from + 2));
	to++ = from++;
	continue;
	}
	}

	*to++ = '%';
	*to++ = hex_digit[c / 16];
	*to++ = hex_digit[c % 16];
	} else {
	to++ = from;
	}
	from++;
	}
	*to = '\0'; // null terminate string

	*len_out = out_len;
	return new_url;
	}
	} // namespace

	char *
	LogUtils::escapify_url(Arena arena, char url, size_t len_in, int len_out, char dst, size_t dst_size, const unsigned char *map)
	{
	return escapify_url_common(arena, url, len_in, len_out, dst, dst_size, map, false);
	}

	char *
	LogUtils::pure_escapify_url(Arena arena, char url, size_t len_in, int len_out, char dst, size_t dst_size,
	const unsigned char *map)
	{
	return escapify_url_common(arena, url, len_in, len_out, dst, dst_size, map, true);
	}

	/*-------------------------------------------------------------------------
	LogUtils::remove_content_type_attributes

	HTTP allows content types to have attributes following the main type and
	subtype. For example, attributes of text/html might be charset=iso-8859.
	The content type attributes are not logged, so this function strips them
	from the given buffer, if present.
	-------------------------------------------------------------------------*/

	void
	LogUtils::remove_content_type_attributes(char type_str, int type_len)
	{
	if (!type_str) {
	*type_len = 0;
	return;
	}
	// Look for a semicolon and cut out everything after that
	//
	char p = static_cast<char >(memchr(type_str, ';', *type_len));
	if (p) {
	*type_len = p - type_str;
	}
	}

	/*
	int
	LogUtils::ip_to_str (unsigned ip, char *str, unsigned len)
	{
	int ret = snprintf (str, len, "%u.%u.%u.%u",
	(ip >> 24) & 0xff,
	(ip >> 16) & 0xff,
	(ip >> 8) & 0xff,
	ip & 0xff);

	return ((ret <= (int)len)? ret : (int)len);
	}
	*/

	// return the seconds remaining until the time of the next roll given
	// the current time, the rolling offset, and the rolling interval
	//
	int
	LogUtils::seconds_to_next_roll(time_t time_now, int rolling_offset, int rolling_interval)
	{
	struct tm lt;
	ink_localtime_r((const time_t *)&time_now, &lt);
	int sidl = lt.tm_sec + lt.tm_min * 60 + lt.tm_hour * 3600;
	int tr = rolling_offset * 3600;
	return ((tr >= sidl ? (tr - sidl) % rolling_interval : (86400 - (sidl - tr)) % rolling_interval));
	}

	ts::TextView
	LogUtils::get_unrolled_filename(ts::TextView rolled_filename)
	{
	auto unrolled_name = rolled_filename;

	// A rolled log will look something like:
	// squid.log_some.hostname.com.20191029.18h15m02s-20191029.18h30m02s.old
	auto suffix = rolled_filename;

	suffix.remove_prefix_at('.');
	// Using the above squid.log example, suffix now looks like:
	// log_some.hostname.com.20191029.18h15m02s-20191029.18h30m02s.old

	// Some suffixes do not have the hostname. Rolled diags.log files will look
	// something like this, for example:
	// diags.log.20191114.21h43m16s-20191114.21h43m17s.old
	//
	// For these, the second delimeter will be a period. For this reason, we also
	// split_prefix_at with a period as well.
	if (suffix.split_prefix_at('_') \|\| suffix.split_prefix_at('.')) {
	// ' + 1' to remove the '_' or second '.':
	return unrolled_name.remove_suffix(suffix.size() + 1);
	}
	// If there isn't a '.' or an '_' after the first '.', then this
	// doesn't look like a rolled file.
	return rolled_filename;
	}

	// Checks if the file pointed to by full_filename either is a regular
	// file or a pipe and has write permission, or, if the file does not
	// exist, if the path prefix of full_filename names a directory that
	// has both execute and write permissions, so there will be no problem
	// creating the file. If the size_bytes pointer is not NULL, it returns
	// the size of the file through it.
	// Also checks the current size limit for the file. If there is a
	// limit and has_size_limit is not null, *has_size_limit is set to
	// true. If there is no limit and has_size_limit is not null,
	// *has_size_limit is set to false. If there is a limit and if the
	// current_size_limit_bytes pointer is not null, it returns the limit
	// through it.
	//
	// returns:
	// 0 on success
	// -1 on system error (no permission, etc.)
	// 1 if the file full_filename points to is neither a regular file
	// nor a pipe
	//
	int
	LogUtils::file_is_writeable(const char full_filename, off_t size_bytes, bool has_size_limit, uint64_t current_size_limit_bytes)
	{
	int ret_val = 0;
	int e;
	struct stat stat_data;

	e = stat(full_filename, &stat_data);
	if (e == 0) {
	// stat succeeded, check if full_filename points to a regular
	// file/fifo and if so, check if file has write permission
	//
	if (!(S_ISREG(stat_data.st_mode) \|\| S_ISFIFO(stat_data.st_mode))) {
	ret_val = 1;
	} else if (!(stat_data.st_mode & S_IWUSR)) {
	errno = EACCES;
	ret_val = -1;
	}
	if (size_bytes) {
	*size_bytes = stat_data.st_size;
	}
	} else {
	// stat failed
	//
	if (errno != ENOENT) {
	// can't stat file
	//
	ret_val = -1;
	} else {
	// file does not exist, check that the prefix is a directory with
	// write and execute permissions

	char *dir;
	char *prefix = nullptr;

	// search for forward or reverse slash in full_filename
	// starting from the end
	//
	const char *slash = strrchr(full_filename, '/');
	if (slash) {
	size_t prefix_len = slash - full_filename + 1;
	prefix = new char[prefix_len + 1];
	memcpy(prefix, full_filename, prefix_len);
	prefix[prefix_len] = 0;
	dir = prefix;
	} else {
	dir = (char *)"."; // full_filename has no prefix, use .
	}

	// check if directory is executable and writeable
	//
	e = access(dir, X_OK \| W_OK);
	if (e < 0) {
	ret_val = -1;
	} else {
	if (size_bytes) {
	*size_bytes = 0;
	}
	}

	if (prefix) {
	delete[] prefix;
	}
	}
	}

	// check for the current filesize limit
	//
	if (ret_val == 0) {
	struct rlimit limit_data;
	e = getrlimit(RLIMIT_FSIZE, &limit_data);
	if (e < 0) {
	ret_val = -1;
	} else {
	if (limit_data.rlim_cur != static_cast<rlim_t> RLIM_INFINITY) {
	if (has_size_limit) {
	*has_size_limit = true;
	}
	if (current_size_limit_bytes) {
	*current_size_limit_bytes = limit_data.rlim_cur;
	}
	} else {
	if (has_size_limit) {
	*has_size_limit = false;
	}
	}
	}
	}

	return ret_val;
	}

	namespace
	{
	// Get a string out of a MIMEField using one of its member functions, and put it into a buffer writer, terminated with a nul.
	//
	void
	marshalStr(ts::FixedBufferWriter &bw, const MIMEField &mf, const char (MIMEField::get_func)(int *length) const)
	{
	int length;
	const char data = (mf.get_func)(&length);

	if (!data or (*data == '\0')) {
	// Empty string. This is a problem, since it would result in two successive nul characters, which indicates the end of the
	// marshaled hearer. Change the string to a single blank character.

	static const char Blank[] = " ";
	data = Blank;
	length = 1;
	}

	bw << std::string_view(data, length) << '\0';
	}

	void
	unmarshalStr(ts::FixedBufferWriter &bw, const char *&data)
	{
	bw << '{';

	while (*data) {
	bw << *(data++);
	}

	// Skip over terminal nul.
	++data;

	bw << '}';
	}

	} // end anonymous namespace

	namespace LogUtils
	{
	// Marshals header tags and values together, with a single terminating nul character. Returns buffer space required. 'buf' points
	// to where to put the marshaled data. If 'buf' is null, no data is marshaled, but the function returns the amount of space that
	// would have been used.
	//
	int
	marshalMimeHdr(MIMEHdr hdr, char buf)
	{
	std::size_t bwSize = buf ? SIZE_MAX : 0;

	ts::FixedBufferWriter bw(buf, bwSize);

	if (hdr) {
	MIMEFieldIter mfIter;
	const MIMEField *mfp = hdr->iter_get_first(&mfIter);

	while (mfp) {
	marshalStr(bw, *mfp, &MIMEField::name_get);
	marshalStr(bw, *mfp, &MIMEField::value_get);

	mfp = hdr->iter_get_next(&mfIter);
	}
	}

	bw << '\0';

	return int(INK_ALIGN_DEFAULT(bw.extent()));
	}

	// Unmarshaled/printable format is {{{tag1}:{value1}}{{tag2}:{value2}} ... }
	//
	int
	unmarshalMimeHdr(char *buf, char dest, int destLength)
	{
	ink_assert(*buf != nullptr);

	const char data = buf;

	ink_assert(data != nullptr);

	ts::FixedBufferWriter bw(dest, destLength);

	bw << '{';

	int pairEndFallback{0}, pairEndFallback2{0}, pairSeparatorFallback{0};

	while (*data) {
	if (!bw.error()) {
	pairEndFallback2 = pairEndFallback;
	pairEndFallback = bw.size();
	}

	// Add open bracket of pair.
	//
	bw << '{';

	// Unmarshal field name.
	unmarshalStr(bw, data);

	bw << ':';

	if (!bw.error()) {
	pairSeparatorFallback = bw.size();
	}

	// Unmarshal field value.
	unmarshalStr(bw, data);

	// Add close bracket of pair.
	bw << '}';

	} // end for loop

	bw << '}';

	if (bw.error()) {
	// The output buffer wasn't big enough.

	static std::string_view FULL_ELLIPSES("...}}}");

	if ((pairSeparatorFallback > pairEndFallback) and ((pairSeparatorFallback + 7) <= destLength)) {
	// In the report, we can show the existence of the last partial tag/value pair, and maybe part of the value. If we only
	// show part of the value, we want to end it with an elipsis, to make it clear it's not complete.

	bw.reduce(destLength - FULL_ELLIPSES.size());
	bw << FULL_ELLIPSES;

	} else if (pairEndFallback and (pairEndFallback < destLength)) {
	bw.reduce(pairEndFallback);
	bw << '}';

	} else if ((pairSeparatorFallback > pairEndFallback2) and ((pairSeparatorFallback + 7) <= destLength)) {
	bw.reduce(destLength - FULL_ELLIPSES.size());
	bw << FULL_ELLIPSES;

	} else if (pairEndFallback2 and (pairEndFallback2 < destLength)) {
	bw.reduce(pairEndFallback2);
	bw << '}';

	} else if (destLength > 1) {
	bw.reduce(1);
	bw << '}';

	} else {
	bw.reduce(0);
	}
	}

	buf += INK_ALIGN_DEFAULT(data - buf + 1);

	return bw.size();
	}

	} // end namespace LogUtils