log2json 0.1.11 → 0.1.12

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
data/bin/redis2disk ADDED
#!/bin/bash
#
# Check every INTERVAL seconds the size of the log2json log queue in Redis,
# and reduce the queue size if its average rate of change over the INTERVAL
# is greater than MAX_RATE for CROSS_COUNT times within EVAL_PERIOD seconds.
#
# The logs will be saved on disk and can be pushed back to the queue by
# another script at a slower rate when the queue is empty most of the time.
#
set -e

# Name of the queue in Redis. Must be a list in Redis.
QUEUE=${QUEUE:-jsonlogs}

# Average number of log records per second over INTERVAL seconds.
MAX_RATE=${MAX_RATE:-25000}

# How many times an average rate of change greater than MAX_RATE must happen
# within EVAL_PERIOD seconds before we reduce the queue size.
CROSS_COUNT=${CROSS_COUNT:-2}

# The length of time (in seconds) within which a "cross-over" is considered
# valid and so counts toward CROSS_COUNT.
# It should be a multiple of INTERVAL.
EVAL_PERIOD=${EVAL_PERIOD:-15}

# Samples the queue size roughly every INTERVAL seconds.
# The smaller the value, the more accurate the rate estimate and the less
# chance of missing a sudden burst of traffic.
INTERVAL=${INTERVAL:-5}

# Lua script for Redis that LPOPs up to N log records off the queue
# and returns them.
LUA_LPOP_KEY_N='
local i = tonumber(ARGV[1])
local res = {}
local length = redis.call("llen", KEYS[1])
if length < i then i = length end
while (i > 0) do
  local item = redis.call("lpop", KEYS[1])
  if (not item) then
    break
  end
  table.insert(res, item)
  i = i - 1
end
return res
'

# Folder in which to store the log records off-loaded from the queue.
BATCH_DIR=${BATCH_DIR:-/mnt/redis}

log() { echo "$(date): $*"; }

# Initialize state explicitly. The original relied on unset variables
# evaluating to 0 inside $(( )), which silently breaks under `set -u`.
period_start=0  # epoch second at which the current EVAL_PERIOD began
count=0         # times MAX_RATE has been crossed within the current period
s1=             # previous queue-size sample (empty on the first iteration)
off_loaded=     # set to 1 right after a batch off-load is started

while true
do
    if [ $(( $(date +%s) - period_start )) -ge "$EVAL_PERIOD" ]; then
        period_start=$(date +%s)
        count=0  # reset at the start of a new period (also reset after an off-load)
        log "New period begins---"
    fi
    s2=$(redis-cli llen "$QUEUE")  # current queue size
    log "queue size=$s2"

    if [ "$s1" ]; then
        delta=$(( s2 - s1 ))
        rate=$(( delta / INTERVAL ))
        log "delta=$delta rate=$rate"

        # If, within the period, we have crossed MAX_RATE CROSS_COUNT times,
        # then move the records from the queue to a batch file.
        if [ "$rate" -gt "$MAX_RATE" ]; then
            count=$(( count + 1 ))
            log "MAX_RATE($MAX_RATE/s) crossed! count=$count"

            if [ "$count" -ge "$CROSS_COUNT" ]; then
                batch_file=$BATCH_DIR/${QUEUE}_$(date +%Y-%m-%dT%T.%N%z)
                n_records=$(( delta * count ))
                log "CROSS_COUNT($CROSS_COUNT) reached! Off loading $n_records log records to $batch_file ..."

                # Quoted expansions: $QUEUE / $n_records / $batch_file would
                # otherwise be subject to word-splitting and globbing.
                redis-cli --eval <(echo "$LUA_LPOP_KEY_N") "$QUEUE" , "$n_records" > "$batch_file" &
                count=0
                off_loaded=1
            fi
        fi
    fi

    if [ "$off_loaded" ]; then
        # Re-sample after starting an off-load so the next delta is not skewed
        # by the records just removed.
        # NOTE(review): the off-load runs in the background, so this sample may
        # race with it — confirm that an approximate baseline is acceptable.
        s1=$(redis-cli llen "$QUEUE")
        off_loaded=
    else
        s1=$s2
    fi
    sleep "$INTERVAL"
done
data/bin/tail CHANGED
Binary file
data/bin/tail-log.sh CHANGED
@@ -4,9 +4,17 @@ set -e
4
4
 
5
5
  # Find out the absolute path to the tail utility.
6
6
  # This is a patched version of the tail utility in GNU coreutils-8.13 compiled for Ubuntu 12.04 LTS.
7
- # The difference is that if header will be shown(ie, with -v or when multiple files are specified),
8
- # it will also print "==> file.name <== [event]" to stdout whenever a file truncation or a new file is
9
- # detected. [event] will be one of "[new_file]" or "[truncated]".
7
+ # With the following differences:
8
+ #
9
+ # - if a header will be shown (i.e., with -v or when multiple files are specified),
10
+ # it will also print "==> file.name <== [event]" to stdout whenever a file truncation or a new file is
11
+ # detected. [event] will be one of "[new_file]" or "[truncated]".
12
+ #
13
+ # - It allows the use of multiple -n options. Each -n will apply to the files specified on the
14
+ # command line in order (i.e., the first -n N corresponds to the first file, etc.).
15
+ # If there are more files listed than the number of -n options, then the last -n applies to the
16
+ # rest of the files.
17
+ #
10
18
  TAIL=$(
11
19
  ruby -- - <<'EOF'
12
20
  require 'log2json'
@@ -37,12 +45,17 @@ build_tail_args() {
37
45
  for fpath in "$@"
38
46
  do
39
47
  sincedb_path=$SINCEDB_DIR/$fpath.since
48
+ nlines=$(wc -l "$fpath" | cut -d' ' -f1)
49
+ nlines=${nlines:-0}
50
+
40
51
  if [ -r "$sincedb_path" ]; then
41
52
  read line < "$sincedb_path"
42
53
  t=($line)
43
54
  # if inode number is unchanged and the current file size is not smaller
44
55
  # then we start tailing from 1 + the line number recorded in the sincedb.
45
- if [[ ${t[0]} == $(stat -c "%i" "$fpath") && ${t[1]} -le $(stat -c "%s" "$fpath") ]]; then
56
+ if [[ ${t[0]} == $(stat -c "%i" "$fpath") &&
57
+ ${t[1]} -le $(stat -c "%s" "$fpath") &&
58
+ ${t[2]} -le "$nlines" ]]; then
46
59
  TAIL_ARGS[$((i++))]="-n+$((t[2] + 1))"
47
60
  # tail -n+N means start tailing from the N-th line of the file
48
61
  # and we're even allowed to specify different -n+N for different files!
@@ -54,7 +67,7 @@ build_tail_args() {
54
67
  # at this point, no last position was recorded in the SINCEDB for fpath,
55
68
  # in this case we'd tail from the end of file.
56
69
 
57
- TAIL_ARGS[$((i++))]="-n+$(($(wc -l "$fpath" | cut -d' ' -f1) + 1))"
70
+ TAIL_ARGS[$((i++))]="-n+$(( nlines + 1 ))"
58
71
  # Note: we can't just ask tail to seek to the end here(ie, with -n0) since
59
72
  # then we'd lose track of the line count.
60
73
  # Note: if fpath doesn't exist yet, then the above evaluates to "-n+1", which
@@ -15,6 +15,16 @@ require 'logger'
15
15
 
16
16
  module Log2Json
17
17
 
18
+ LEVELS = {
19
+ :debug => Logger::DEBUG,
20
+ :info => Logger::INFO,
21
+ :warn => Logger::WARN,
22
+ :error => Logger::ERROR,
23
+ :fatal => Logger::FATAL,
24
+ :unknown => 5
25
+ }
26
+ LEVELS.default = Logger::INFO
27
+
18
28
  def self.log_formatter
19
29
  proc do |severity, datetime, progname, msg|
20
30
  "#{datetime.strftime('%Y-%m-%dT%H:%M:%S%z')}: [#{severity}] #{$$} #{msg.gsub(/\n/, '#012')}\n"
@@ -37,6 +47,7 @@ module Log2Json
37
47
  config.active_record.colorize_logging = false
38
48
  end
39
49
  logger = ::Logger.new(path)
50
+ logger.level = LEVELS[config.log_level]
40
51
  logger.formatter = ::Log2Json::log_formatter
41
52
  if defined?(ActiveSupport::TaggedLogging)
42
53
  ActiveSupport::TaggedLogging.new(logger)
@@ -49,6 +60,7 @@ module Log2Json
49
60
  #
50
61
  def self.create_custom_unicorn_logger(config)
51
62
  logger = ::Logger.new(config.set[:stderr_path])
63
+ logger.level = Logger::INFO
52
64
  logger.formatter = ::Log2Json::log_formatter
53
65
  logger
54
66
  end
@@ -1,6 +1,6 @@
1
1
  Gem::Specification.new do |s|
2
2
  s.name = 'log2json-loggers'
3
- s.version = '0.1.9'
3
+ s.version = '0.1.11'
4
4
  s.summary = "Custom loggers for Rails and Unicorn that use log2json's single-line log format."
5
5
  s.description = IO.read(File.join(File.dirname(__FILE__), 'README'))
6
6
  s.authors = ['Jack Kuan']
data/log2json.gemspec CHANGED
@@ -1,6 +1,6 @@
1
1
  Gem::Specification.new do |s|
2
2
  s.name = 'log2json'
3
- s.version = '0.1.11'
3
+ s.version = '0.1.12'
4
4
  s.summary = "Read, filter and ship logs. ie, poor man's roll-your-own, light-weight logstash replacement."
5
5
  s.description = IO.read(File.join(File.dirname(__FILE__), 'README'))
6
6
  s.authors = ['Jack Kuan']
@@ -1,9 +1,25 @@
1
- 1049a1050,1051
2
- > if (print_headers)
3
- > printf ("==> %s <== [new_file]\n", pretty_name (f));
4
- 1171a1174,1175
5
- > if (print_headers)
6
- > printf ("==> %s <== [truncated]\n", name);
7
- 1286a1291,1292
8
- > if (print_headers)
9
- > printf ("==> %s <== [truncated]\n", name);
1
+ 83,85d82
2
+ < /* Size of the array that stores the -n option values. */
3
+ < #define MAX_FILE_SKIP_LINES 256
4
+ <
5
+ 187,189d183
6
+ < /* Stores the number of lines to skip from the start for each file. */
7
+ < static int n_units_argv[MAX_FILE_SKIP_LINES];
8
+ <
9
+ 1056,1057d1049
10
+ < if (print_headers)
11
+ < printf ("==> %s <== [new_file]\n", pretty_name (f));
12
+ 1180,1181d1171
13
+ < if (print_headers)
14
+ < printf ("==> %s <== [truncated]\n", name);
15
+ 1297,1298d1286
16
+ < if (print_headers)
17
+ < printf ("==> %s <== [truncated]\n", name);
18
+ 1930d1917
19
+ < int n_units_argc = 0;
20
+ 1962d1948
21
+ < n_units_argv[n_units_argc++] = *n_units;
22
+ 2177c2163
23
+ < ok &= tail_file (&F[i], i < MAX_FILE_SKIP_LINES ? n_units_argv[i] : n_units);
24
+ ---
25
+ > ok &= tail_file (&F[i], n_units);
data/src/tail.c CHANGED
@@ -80,6 +80,9 @@
80
80
  /* FIXME: make Follow_name the default? */
81
81
  #define DEFAULT_FOLLOW_MODE Follow_descriptor
82
82
 
83
+ /* Size of the array that stores the -n option values. */
84
+ #define MAX_FILE_SKIP_LINES 256
85
+
83
86
  enum Follow_mode
84
87
  {
85
88
  /* Follow the name of each file: if the file is renamed, try to reopen
@@ -181,6 +184,9 @@ static bool forever;
181
184
  /* If true, count from start of file instead of end. */
182
185
  static bool from_start;
183
186
 
187
+ /* Stores the number of lines to skip from the start for each file. */
188
+ static int n_units_argv[MAX_FILE_SKIP_LINES];
189
+
184
190
  /* If true, print filename headers. */
185
191
  static bool print_headers;
186
192
 
@@ -1921,6 +1927,7 @@ parse_options (int argc, char **argv,
1921
1927
  double *sleep_interval)
1922
1928
  {
1923
1929
  int c;
1930
+ int n_units_argc = 0;
1924
1931
 
1925
1932
  while ((c = getopt_long (argc, argv, "c:n:fFqs:v0123456789",
1926
1933
  long_options, NULL))
@@ -1952,6 +1959,7 @@ parse_options (int argc, char **argv,
1952
1959
  ? _("invalid number of lines")
1953
1960
  : _("invalid number of bytes")));
1954
1961
  }
1962
+ n_units_argv[n_units_argc++] = *n_units;
1955
1963
  }
1956
1964
  break;
1957
1965
 
@@ -2166,7 +2174,7 @@ main (int argc, char **argv)
2166
2174
  xfreopen (NULL, "wb", stdout);
2167
2175
 
2168
2176
  for (i = 0; i < n_files; i++)
2169
- ok &= tail_file (&F[i], n_units);
2177
+ ok &= tail_file (&F[i], i < MAX_FILE_SKIP_LINES ? n_units_argv[i] : n_units);
2170
2178
 
2171
2179
  if (forever && ignore_fifo_and_pipe (F, n_files))
2172
2180
  {
metadata CHANGED
@@ -1,7 +1,7 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: log2json
3
3
  version: !ruby/object:Gem::Version
4
- version: 0.1.11
4
+ version: 0.1.12
5
5
  prerelease:
6
6
  platform: ruby
7
7
  authors:
@@ -9,7 +9,7 @@ authors:
9
9
  autorequire:
10
10
  bindir: bin
11
11
  cert_chain: []
12
- date: 2013-10-15 00:00:00.000000000 Z
12
+ date: 2013-10-21 00:00:00.000000000 Z
13
13
  dependencies:
14
14
  - !ruby/object:Gem::Dependency
15
15
  name: jls-grok
@@ -114,6 +114,7 @@ files:
114
114
  - README
115
115
  - bin/lines2redis
116
116
  - bin/nginxlog2json
117
+ - bin/redis2disk
117
118
  - bin/redis2es
118
119
  - bin/syslog2json
119
120
  - bin/tail