#!/usr/bin/mawk -We
# *********************************************************************
# total: sums up selected table columns.
#
# Copyright (c) 2001,2002,2003 Carlo Strozzi
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
#
# *********************************************************************
#  $Id: total,v 1.3 2003/05/23 20:31:53 carlo Exp $

# Initialisation: set the field separators and default number format,
# read the NoSQL environment settings and parse the command line.
#
# Recognised arguments:
#   -l, --last         use the last occurrence of a duplicated column name
#   -N, --no-header    do not print the table header
#   -r, --report       also print the table body and ruler lines
#   -i, --input  FILE  read the table from FILE
#   -o, --output FILE  write the result to FILE
#   -T, --total  NAME  append a grand-total column called NAME
#   -c, --currency     format totals with "%.2f" instead of "%s"
#   -h, --help         print the help text and exit with status 1
# Every other argument is taken as the name of a column to be summed.
BEGIN {
  NULL = ""; FS = OFS = "\t"; fmt = "%s"

  # Get local settings.
  nosql_install = ENVIRON["NOSQL_INSTALL"]
  stdout = ENVIRON["NOSQL_STDOUT"]
  stderr = ENVIRON["NOSQL_STDERR"]

  # Set default values if necessary.
  if (nosql_install == NULL) nosql_install = "/usr/local/nosql"
  if (stdout == NULL) stdout = "/dev/stdout"
  if (stderr == NULL) stderr = "/dev/stderr"

  # Walk the arguments by count (ARGC) instead of stopping at the first
  # empty string, so that an empty argument cannot hide the arguments
  # that follow it.
  for (i = 1; i < ARGC; i++) {
    arg = ARGV[i]
    if (arg == "-l" || arg == "--last") pick_last = 1
    else if (arg == "-N" || arg == "--no-header") no_hdr = 1
    else if (arg == "-r" || arg == "--report") report = 1
    else if (arg == "-i" || arg == "--input") i_file = ARGV[++i]
    else if (arg == "-o" || arg == "--output") o_file = ARGV[++i]
    else if (arg == "-T" || arg == "--total") gtcol = ARGV[++i]
    else if (arg == "-c" || arg == "--currency") fmt = "%.2f"
    else if (arg == "-h" || arg == "--help") {
       system("grep -v '^#' " nosql_install "/help/total.txt")
       rc = 1			# Tells the END rule to do nothing
       exit(rc)
    }
    else target_cols[arg] = arg	# Name of a column to be summed
  }

  ARGC = 1					# Fix argv[]

  # Fall back to the default output; if an input file was named, make
  # it the only file operand awk will read.
  if (o_file == NULL) o_file = stdout
  if (i_file != NULL) { ARGV[1] = i_file; ARGC = 2 }
}

#
# Main loop
#

# Header line: record the column layout and, unless -N was given,
# write the header to the output.
NR == 1 {

  # Strip the SOH (\001) markers that prefix the column names.
  gsub(/\001/, "")

  # Fill the two lookup tables: P maps a column name to its position,
  # N maps a position back to its name.  Column names may be duplicated
  # (it may happen after a join): by default only the first occurrence
  # is recorded, while with '-l' every occurrence is recorded, so P
  # ends up pointing at the last one.
  for (p = 1; p <= NF; p++) {
    if (!pick_last && P[$p] != NULL) continue
    P[$p] = p
    N[p] = $p
  }

  # Make room for the grand-total column, if one was requested.
  if (gtcol != NULL) $0 = $0 OFS gtcol

  if (no_hdr) next

  # Put the SOH marker back in front of every column name and print.
  printf("\001") > o_file
  gsub(/\t/, "\t\001")
  print > o_file
  next
}

# Table body: add each selected column of the current row to its
# running total and, in report mode, echo the row to the output.
{
  for (col = 1; col <= NF; col++) {
      name = N[col]

      # Skip columns that were not requested on the command line.
      if (target_cols[name] == NULL) continue

      # Skip occurrences of a duplicated name other than the chosen one.
      if (P[name] != col) continue

      total[col] += $col
  }

  # Keep the row as wide as the header when a grand-total column is
  # in use; its cell is left empty on body rows.
  if (gtcol != NULL) $0 = $0 OFS

  if (report) {
      print > o_file
  }
}

# Final step: build and print the totals row.  In report mode the row
# is framed by a line of dashes above and a line of equal signs below.
END {
  # A non-zero rc means BEGIN already bailed out (help was requested).
  if (rc) exit(rc)

  # NF still holds the field count of the last record read; when -T is
  # in effect that count includes the extra trailing column which the
  # header and body rules append, so the loop also emits the separator
  # that precedes the grand total.
  for (i=1; i<=NF; i++) {
      if (i > 1) value = value OFS
      if (target_cols[N[i]] != NULL && i == P[N[i]]) {
         if (gtcol != NULL) gt += total[i]

         # "+ 0" forces a number, so a column that was never added to
         # (e.g. a table with no body rows) shows 0 with the default
         # "%s" format too, as it already does with "%.2f".
         #
         # NOTE(review): with "%s" awk converts non-integral numbers
         # through CONVFMT ("%.6g" unless changed), so fractional
         # totals keep only six significant digits; -c avoids that.
         value = value sprintf(fmt, total[i] + 0)
      }
  }

  # Same numeric coercion for the grand total, which stays unset when
  # none of the requested columns was found.
  if (gtcol != NULL) value = value sprintf(fmt, gt + 0)

  if (report) {
     # Ruler line: one dash under every non-empty cell of the totals.
     dashes = value
     gsub(/[^\t]+/,"-",dashes)
     print dashes > o_file
  }

  print value > o_file

  if (report) {
     # Closing line: one equal sign under every non-empty cell.
     gsub(/[^\t]+/,"=",value)
     print value > o_file
  }
}

# End of program.
