vdw/trunk/WOU_Util.pm

package WOU_Util;

# Utilities
#
# Jeremy Hickerson, 3/5/2002

use strict;
use Safe;

BEGIN {
    use Exporter   ();
    use vars       qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);

    # set the version for version checking
    $VERSION     = 1.00;
    @ISA         = qw(Exporter);
    @EXPORT      = qw(&compound_sort &hash_compare &output_delimited
                      &date_stamp &arr2hash &date_compare &add2hash &fix_nulls
                      &ssn_format &join_table_subs &is_true &draw_from_hat
                      &num_sort &add_commas2dollars add_commas
                      &date_stamp_mrep &date_sort &delta_time
                      &outer_join_table_subs);
    %EXPORT_TAGS = ( );     # eg: TAG => [ qw!name1 name2! ],
    @EXPORT_OK   = qw( );
}
use vars @EXPORT_OK;
use subs qw(compound_sort sort_nested_hash hash_compare output_delimited
            date_stamp arr2hash date_compare add2hash fix_nulls ssn_format
            join_table_subs is_true draw_from_hat num_sort add_commas2dollars
            add_commas date_stamp_mrep date_sort delta_time
            outer_join_table_subs);

my $compartment = new Safe;

$compartment->permit(qw());  # nothing!  just need comparison operators

# ============================================================================
#                                 Routines
# ============================================================================
sub compound_sort {

                                      # "special sort" param is optional
    my ($rrecords_hash, $rkeys_array, $rh_special_sort) = @_;

    my ($arr_size, $rresults_array, $rrecord_key, $sort_key, $sortkey_val,
        %sort_category_hash, $rsort_category_array, $depth);

    # Returns reference to array holding all values in compound sort order.
    #
    # Explanation
    # -----------
    # %{$rrecords_hash} is a hash of hashes, where the hashes have the keys in
    # @$rkeys_array (and maybe some additional fields).  Each hash is uniquely
    # identified by $rrecords_hash->{$rrecord_key}.
    #
    # Below is an example of %records_hash
    #    $term_code{$pidm} = { };
    #    $rrecord_key = $term_code{$pidm};
    #
    #    $records{$rrecord_key} = 
    #    { "term"        => $term_code,
    #      "ethnicity"   => $ethnicity,
    #      "recr_status" => $recr_status,
    #      "first_name"  => $rname,
    #      "middle_name" => $rname,
    #      "last_name"   => $rname,
    #      "street"      => $raddr,
    #      "city"        => $raddr,
    #      "state"       => $raddr,
    #      "zip"         => $raddr,
    #      "nation"      => $raddr,
    #      "phone"       => $phone,
    #      "major"       => $major,
    #      "gpa"         => $gpa,
    #      "high_school" => $high_school };
    #
    # So %records is of the form (r2a => r3a, r2b => r3b, ... r2n => r3n),
    # where the r2's are the $$record_key's and the r3's are the anonymous
    # hashes of ("term" => $term_code, "ethnicity" => $ethnicity, ...).
    #
    # Compound sorting will be accomplished by building a hash of nested
    # hash references, and pushing each $rrecord_key onto an array reference
    # held by the hash at the end of the hash reference chain.
    # If @$rkeys_array = ("term_code", "ethnicity", "recr_status") then this
    # array reference (call it $rsort_category_array) is of the form
    #
    #     $sort_category_hash{$term_code}->{$ethnicity}->{$recr_status}.
    #
    # The values of $term_code, $ethnicity, etc. for any record are given by 
    #
    #      $sortkey_val = $rrecords_hash->{$rrecord_key}->{$sort_key};
    #
    # Each @{$rsort_category_array} holds all the records that belong to the
    # given compound sort category.


    if (defined($rh_special_sort) ) {
        # make sure $rh_special_sort{$sort_key} is defined for all values so
        # we don't have to check on every inner loop iteration below.
        foreach $sort_key (@{$rkeys_array}) {
            if (!exists($rh_special_sort->{$sort_key}) ) {
                $rh_special_sort->{$sort_key} = "";
            }
        }
    }

    # ===================
    #  Build Nested Hash
    # ===================
    #  Builds a nested hash where the nested keys are values specific to this
    #  record.  We will then sort the keys from the outermost to the innermost.
    #  Need to do numeric sort where needed based on the existence of the
    #  hash key 'sort' at the given hash level.  The numeric sort routine
    #  (or any other type of special sort on a given key will be passed in
    #  $rh_special_sort, where the hash key is the sort column value and the
    #  hash value is the perl code reference for the special sort routine.
    #  This code ref will be put on the hash key 'sort' at the appropriate
    #  level when the nested keys are created below.
    foreach $rrecord_key (keys %{$rrecords_hash}) {

    foreach $sort_key (@{$rkeys_array}) {

        # Put special sort routine in at every level needed.  Will just
        # overwrite it w/ the same value every iteration; this is probably
        # faster than checking for its existence every time.

        $sortkey_val = $rrecords_hash->{$rrecord_key}->{$sort_key};
        $arr_size = @{$rkeys_array};

        if ($sort_key eq $rkeys_array->[0]) {  # on first sort_key

            $sort_category_hash{"sort"} = $rh_special_sort->{$sort_key};

        $sort_category_hash{$sortkey_val} =
                $sort_key ne $rkeys_array->[$arr_size - 1] ?  { } : [ ]
            unless exists $sort_category_hash{$sortkey_val};

        $rsort_category_array = $sort_category_hash{$sortkey_val};
        }
        else {

            $rsort_category_array->{"sort"} = $rh_special_sort->{$sort_key};

            # nest this reference in previous reference
            $rsort_category_array->{$sortkey_val} =
                $sort_key ne $rkeys_array->[$arr_size - 1] ?  { } : [ ]
                unless exists $rsort_category_array->{$sortkey_val};

            $rsort_category_array = $rsort_category_array->{$sortkey_val}; 
        }
    }

    # put the record key on full nested reference
        push @{$rsort_category_array}, $rrecords_hash->{$rrecord_key};
    }

    # ==================
    #  Sort Nested Hash
    # ==================
    $depth = @{$rkeys_array};
    $rresults_array =
        sort_nested_hash(\%sort_category_hash, $depth);

    return $rresults_array;
}


sub sort_nested_hash {
    my ($rsort_category_hash, $depth) = @_;

    # Recurses to $depth, sorting hash %{$rsort_category_hash} keys at every
    # level.  Pushes values at final levels onto @sort_results,  which ends
    # up holding all values in correct compound sort order.

    my ($sorted_key, @sorted_keys_array, @sort_results, $rresults_array,
        $hash_ref, $sort_sub);

    #===============================
    # check if we're done recursing
    #===============================
    if ($depth == 0) {
        # return array of record_keys for this compound sort category
        # (remember, rsort_category_hash now points to an anonymous array
    # of anonymous hashes at the final nested hash key)
        return $rsort_category_hash;
    }

    #==========================================
    # otherwise, sort the keys at this depth
    # and call self to sort keys at next depth
    #==========================================
    if ( $rsort_category_hash->{sort} ) {
        $sort_sub = $rsort_category_hash->{sort};
        delete $rsort_category_hash->{sort};  # otherwise it will be in the output

        @sorted_keys_array = sort $sort_sub keys %{$rsort_category_hash};
    }
    else {
        delete $rsort_category_hash->{sort};  # delete dummy sort key
        @sorted_keys_array = sort keys %{$rsort_category_hash};
    }


    foreach $sorted_key (@sorted_keys_array) {

        # "append" $sorted_key to hash ref passed in and call self
        $rresults_array = sort_nested_hash($rsort_category_hash->{$sorted_key},
                                       $depth - 1);

        push @sort_results, @{$rresults_array};
    }

    return \@sort_results;
}

# hash_compare():  compares fields in record 1 with fields in record 2.  Allows
# Oracle '%' wildcard at end of expression, ignores case.
sub hash_compare {

    my ($rh_hash1, $rh_hash2) = @_;
    my ($field_name, $hash2_field_re);

    # if we look at each hash as a record in a table, where the keys
    # are the field names and the values the field values, then we
    # compare if the same field names have the same values.  We take
    # hash2 to be a subset of hash 1.  If not (i.e. if hash2 has a 
    # field that isn't in hash1) then the hashes don't match.  If all
    # values for fields in hash2 match the values for the same fields
    # in hash1 then the hashes match.  We allow a "%" wildcard at the
    # end of a string.  "xyz%" matches /^(xyz)(.*)$/  (like
    # the Oracle "like 'xyz%'", but only at the end of a string).

    foreach $field_name (keys %{$rh_hash2} ) {

        $hash2_field_re = $rh_hash2->{$field_name};

        $hash2_field_re =~ s/^(.*)%$/$1\(\.\*\)/;

        if ( ! exists $rh_hash1->{$field_name} ||
             $rh_hash1->{$field_name} !~ /^$hash2_field_re$/i ) {

            return 0;  # "record" doesn't match - return false
        }
    }

    # fall-through means all fields in hash1 matched, so "record" matches
    # return true
    return 1;
}


sub output_delimited {
    my ($fh_out, $ra_records, $ra_field_order, $rh_field_titles, $delim,
        $no_titles) = @_;

    my ($rh_record, $field_name, $save_ors);

    if (!$delim ) { $delim = "\|" }  # "|" is default

    fix_nulls($ra_records);  # clean up data

    # check Output Record Separator
    if ( defined($\) ) {
        $save_ors = $\;
        $\ = "";  # disable for field-by-field print below
    }

    # output delimited field titles
    if ( !$no_titles or uc($no_titles) eq "N" ) {
        foreach $field_name (@{$ra_field_order} ) {
            # print $field_name for field title if no $rh_field_titles
            print $fh_out $rh_field_titles ? $rh_field_titles->{$field_name}
                                       : $field_name;

            # don't print delimiter if on last field
            print $fh_out $delim unless $field_name eq
                $ra_field_order->[ @{$ra_field_order} - 1 ];
        }

        if ( defined($save_ors) ) {
            print $fh_out $save_ors;
        }
        else {
            print $fh_out "\n";
        }
    }

    OUTPUT_LOOP:
    foreach $rh_record (@{$ra_records} ) {

        next OUTPUT_LOOP unless defined( %{$rh_record} ); 

        # fall-through   

        # output delimited field values
        foreach $field_name (@{$ra_field_order} ) {
            # allow the possibility that records may not have all the fields
            if ( exists $rh_record->{$field_name} ) {
                print $fh_out $rh_record->{$field_name};
            }

            # don't print delimiter if on last field
            print $fh_out $delim unless $field_name eq
            $ra_field_order->[ @{$ra_field_order} - 1 ];
        }

        if ( defined($save_ors) ) {
            $\ = $save_ors;  # restore saved value to $\
            print $fh_out "";  # this will print the Output Record Separator
        }
        else {
            print $fh_out "\n";
        }
    }
}


sub date_stamp {
    my @ts = localtime;
    my $timestamp = sprintf "%d/%d/%d  %.2d:%.2d",
                 $ts[4] + 1,
                 $ts[3],
                 1900 + $ts[5],
                 $ts[2],
                 $ts[1];
    return $timestamp;
}


sub date_stamp_mrep {

    my %months = ( 1   =>  "JAN",
                   2   =>  "FEB",
                   3   =>  "MAR",
                   4   =>  "APR",
                   5   =>  "MAY",
                   6   =>  "JUN",
                   7   =>  "JUL",
                   8   =>  "AUG",
                   9   =>  "SEP",
                   10  =>  "OCT",
                   11  =>  "NOV",
                   12  =>  "DEC"  );

    my @ts = localtime;
    my $timestamp = sprintf "%.2d-%s-%.2d %.2d:%.2d:%.2d",
                 $ts[3],
                 $months{ $ts[4] + 1 },
                 substr(1900 + $ts[5], 2, 2),
                 $ts[2],
                 $ts[1],
                 $ts[0];
    return $timestamp;
}


sub arr2hash {
    my $array_ref = shift;

    my ($value, %hash, $i);

    $i = 0;
    foreach $value ( @{$array_ref} ) { $hash{$i++} = $value }
    return \%hash;
}


sub date_compare {
    my ($date, $op, $refdate) = @_;

    my ($mm_date, $dd_date, $yyyy_date) = split(/\//, $date);
    my ($mm_ref, $dd_ref, $yyyy_ref) = split(/\//, $refdate);

    my $date_str = $yyyy_date . $mm_date . $dd_date;
    my $ref_str  = $yyyy_ref  . $mm_ref  . $dd_ref;

    $compartment->reval( qq{
        ($date_str $op $ref_str) || return 0;

     # fall-through
     return 1;
    } );
}


# Note:  You don't have to pass $rh_field_map, and if passed, it doesn't need
# values for every field.  This sub will translate the fieldnames passed in
# $rh_field_map (if any) and leave the rest unchanged.
sub add2hash {

    my ($rh_hash1, $rh_hash2, $rh_field_map) = @_;

    my ($new_key, $mapped_key);

    foreach $new_key ( keys %{$rh_hash2} ) {

        if ( defined($rh_field_map) and
             exists($rh_field_map->{$new_key} ) ) {
            $mapped_key = $rh_field_map->{$new_key};
        }
        else { $mapped_key = $new_key }

        if (!exists($rh_hash1->{$mapped_key} )  ) {  # if name conflict, hash1 wins
            $rh_hash1->{$mapped_key} = $rh_hash2->{$new_key};
        }
    }
}


sub fix_nulls {

    my $ra_hashes = shift;

    my ($rh_hash, $field);

    FIX_LOOP:
    for $rh_hash ( @{ $ra_hashes } ) {

        next FIX_LOOP unless defined( %{$rh_hash} );

        # fall-through

        for $field ( keys %{ $rh_hash } ) {

            if ( !defined($rh_hash->{$field} )  ) {
                $rh_hash->{$field} = "";
            }

        }
    }
}


sub ssn_format {
    my $str = shift;

    length($str) < 6 && return $str;

    # fall-through
    return substr($str, 0, 3) . "-" . substr($str, 3, 2) . "-" . substr($str, 5);
}


# Has optional final parm "outer_join".  If outer_join is 'Y' then will return
# rows from sub1 even if no corresponding rows from sub2.
sub join_table_subs {
    my ($rs_sub1, $ra_parms1, $rs_sub2, $ra_parms2, $outer_join) = @_;

    my (@new_table, $ra_sub1, $rh_sub1, $ra_sub2, $rh_sub2, @subst_parms, $parm,
        $subst_parm, $rh_new, $got_join_rows);

    $ra_sub1 = &{ $rs_sub1 } ( @{ $ra_parms1 } );


    foreach $rh_sub1 ( @{ $ra_sub1 } ) {

        while (shift @subst_parms) { }  # reset

        # substitute $rh_sub1 values for relational parms (identified by "$" prefix)
        foreach $parm ( @{$ra_parms2} ) {
            $subst_parm = $parm;

            if ( $subst_parm =~ /^\$/ ) {
                $subst_parm =~ s/^\$//;

                $subst_parm = $rh_sub1->{$subst_parm};
            }

            push @subst_parms, $subst_parm;
        }

        $ra_sub2 = &{ $rs_sub2 } ( @subst_parms );

        $got_join_rows = 0;
        foreach $rh_sub2 ( @{ $ra_sub2 } ) {

            $got_join_rows = 1;
            $rh_new = { };  # get new memory
            add2hash($rh_new, $rh_sub1);  # "dup" $rh_sub1

            add2hash($rh_new, $rh_sub2);
            push @new_table, $rh_new;
        }

        if ( defined($outer_join) and
             $outer_join eq 'Y'   and
             !$got_join_rows ) {

            $rh_new = { };  # get new memory
            add2hash($rh_new, $rh_sub1);  # "dup" $rh_sub1

            push @new_table, $rh_new;
        }
    }

    return \@new_table;
}


sub is_true {

    my $comparison_str = shift;

    $compartment->reval( qq{
        if ($comparison_str) { return 1 }

        # fall-through
        return 0;
    } );
}


# draw_from_hat() - single arg is ref to array of scalar identifiers
sub draw_from_hat {

    my $ra_population = shift;

    my ($identifier, %rand_population, $cnt, $rand_no, @sorted_keys,
        @save_sorted_keys, $rand_key, $pop_size, $size);

    $pop_size = @{$ra_population};


    # put each identifier into %rand_population under a random key
    foreach $identifier (@$ra_population) {

    $rand_no = rand;
    while ( exists $rand_population{$rand_no} ) {
        $rand_no = rand;
    }

    $rand_population{$rand_no} = $identifier;
    }


    # pick the random number of times to iterate
    $rand_no = 0;

    while ( $rand_no <= 0 ) {
    $rand_no = rand;
    }

    $rand_no *= ($pop_size * 5);  # go through population up to 5 times just
                                  # so we don't have any bias for or against
                                  # those at the beginning or end of the
                                  # population (note:  rand returns decimals
                                  # between 0 and 1)

    $rand_no = sprintf("%d", $rand_no + 1);  # make sure the integer part is > 0
                         # so that we get at least 1 iteration


    # sort by random keys and iterate a random number of times to pick the winner

    @sorted_keys = (sort keys %rand_population);
    @save_sorted_keys = @sorted_keys;

    $cnt     = 0;

    while ( $cnt != $rand_no ) {

    $cnt++;

    $size = @sorted_keys;

    ( $size ) || ( @sorted_keys = @save_sorted_keys );

    $rand_key = shift @sorted_keys;

    }


    return $rand_population{$rand_key};

}


sub num_sort {
    $a <=> $b;
}

sub date_sort {
    date_compare($a, "<",  $b) && return  -1;
    date_compare($a, "==", $b) && return   0;
    date_compare($a, ">",  $b) && return   1;
}


sub add_commas2dollars {

    my $amount = shift;

    my ($dollars, $cents);

    ($dollars, $cents) = split(/\./, $amount);

    if ( !defined($cents) ) { $cents = 0 };

    return add_commas($dollars) . '.' . substr(sprintf("%.2d", $cents), 0, 2);
}


sub add_commas {

    my $integer = shift;

    my ($digit, $pos, @digits, $char, $cnt, $integer_w_commas);

    $cnt = 0;
    # grab each digit starting w/ the last
    for ( $pos = length($integer) - 1; $pos >= 0; $pos-- ) {

        $cnt++;

        $digit = substr($integer, $pos, 1);
        push @digits, $digit;

        if ( $cnt % 3 == 0 ) {
            push @digits, ',';
        }
    }

    while ( defined($char = pop @digits) ) {
        $integer_w_commas .= $char;
    }

    $integer_w_commas =~ s/^,//;  # in case $cnt ended on a multiple of 3

    return $integer_w_commas;
}


sub delta_time {

    my $delta_hrs = shift;

    defined($delta_hrs) && $delta_hrs =~ /^[-+]*\d+/
        or die "ERROR:  bad param $delta_hrs";

    my (@ts);

    @ts = localtime( time() + ($delta_hrs * 3600) );

    # fall-through
    my $timestamp = sprintf "%.2d/%.2d/%d  %.2d:%.2d",
    $ts[4] + 1,
    $ts[3],
    1900 + $ts[5],
    $ts[2],
    $ts[1];

    return $timestamp;
}


return 1;  # for module


1	package WOU_Util;
2
3	# Utilities
4	#
5	# Jeremy Hickerson, 3/5/2002
6
7	use strict;
8	use Safe;
9
10	BEGIN {
11	use Exporter ();
12	use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);
13
14	# set the version for version checking
15	$VERSION = 1.00;
16	@ISA = qw(Exporter);
17	@EXPORT = qw(&compound_sort &hash_compare &output_delimited
18	&date_stamp &arr2hash &date_compare &add2hash &fix_nulls
19	&ssn_format &join_table_subs &is_true &draw_from_hat
20	&num_sort &add_commas2dollars add_commas
21	&date_stamp_mrep &date_sort &delta_time
22	&outer_join_table_subs);
23	%EXPORT_TAGS = ( ); # eg: TAG => [ qw!name1 name2! ],
24	@EXPORT_OK = qw( );
25	}
26	use vars @EXPORT_OK;
27	use subs qw(compound_sort sort_nested_hash hash_compare output_delimited
28	date_stamp arr2hash date_compare add2hash fix_nulls ssn_format
29	join_table_subs is_true draw_from_hat num_sort add_commas2dollars
30	add_commas date_stamp_mrep date_sort delta_time
31	outer_join_table_subs);
32
33	my $compartment = new Safe;
34
35	$compartment->permit(qw()); # nothing! just need comparison operators
36
37	# ============================================================================
38	# Routines
39	# ============================================================================
40	sub compound_sort {
41
42	# "special sort" param is optional
43	my ($rrecords_hash, $rkeys_array, $rh_special_sort) = @_;
44
45	my ($arr_size, $rresults_array, $rrecord_key, $sort_key, $sortkey_val,
46	%sort_category_hash, $rsort_category_array, $depth);
47
48	# Returns reference to array holding all values in compound sort order.
49	#
50	# Explanation
51	# -----------
52	# %{$rrecords_hash} is a hash of hashes, where the hashes have the keys in
53	# @$rkeys_array (and maybe some additional fields). Each hash is uniquely
54	# identified by $rrecords_hash->{$rrecord_key}.
55	#
56	# Below is an example of %records_hash
57	# $term_code{$pidm} = { };
58	# $rrecord_key = $term_code{$pidm};
59	#
60	# $records{$rrecord_key} =
61	# { "term" => $term_code,
62	# "ethnicity" => $ethnicity,
63	# "recr_status" => $recr_status,
64	# "first_name" => $rname,
65	# "middle_name" => $rname,
66	# "last_name" => $rname,
67	# "street" => $raddr,
68	# "city" => $raddr,
69	# "state" => $raddr,
70	# "zip" => $raddr,
71	# "nation" => $raddr,
72	# "phone" => $phone,
73	# "major" => $major,
74	# "gpa" => $gpa,
75	# "high_school" => $high_school };
76	#
77	# So %records is of the form (r2a => r3a, r2b => r3b, ... r2n => r3n),
78	# where the r2's are the $$record_key's and the r3's are the anonymous
79	# hashes of ("term" => $term_code, "ethnicity" => $ethnicity, ...).
80	#
81	# Compound sorting will be accomplished by building a hash of nested
82	# hash references, and pushing each $rrecord_key onto an array reference
83	# held by the hash at the end of the hash reference chain.
84	# If @$rkeys_array = ("term_code", "ethnicity", "recr_status") then this
85	# array reference (call it $rsort_category_array) is of the form
86	#
87	# $sort_category_hash{$term_code}->{$ethnicity}->{$recr_status}.
88	#
89	# The values of $term_code, $ethnicity, etc. for any record are given by
90	#
91	# $sortkey_val = $rrecords_hash->{$rrecord_key}->{$sort_key};
92	#
93	# Each @{$rsort_category_array} holds all the records that belong to the
94	# given compound sort category.
95
96
97	if (defined($rh_special_sort) ) {
98	# make sure $rh_special_sort{$sort_key} is defined for all values so
99	# we don't have to check on every inner loop iteration below.
100	foreach $sort_key (@{$rkeys_array}) {
101	if (!exists($rh_special_sort->{$sort_key}) ) {
102	$rh_special_sort->{$sort_key} = "";
103	}
104	}
105	}
106
107	# ===================
108	# Build Nested Hash
109	# ===================
110	# Builds a nested hash where the nested keys are values specific to this
111	# record. We will then sort the keys from the outermost to the innermost.
112	# Need to do numeric sort where needed based on the existence of the
113	# hash key 'sort' at the given hash level. The numeric sort routine
114	# (or any other type of special sort on a given key will be passed in
115	# $rh_special_sort, where the hash key is the sort column value and the
116	# hash value is the perl code reference for the special sort routine.
117	# This code ref will be put on the hash key 'sort' at the appropriate
118	# level when the nested keys are created below.
119	foreach $rrecord_key (keys %{$rrecords_hash}) {
120
121	foreach $sort_key (@{$rkeys_array}) {
122
123	# Put special sort routine in at every level needed. Will just
124	# overwrite it w/ the same value every iteration; this is probably
125	# faster than checking for its existence every time.
126
127	$sortkey_val = $rrecords_hash->{$rrecord_key}->{$sort_key};
128	$arr_size = @{$rkeys_array};
129
130	if ($sort_key eq $rkeys_array->[0]) { # on first sort_key
131
132	$sort_category_hash{"sort"} = $rh_special_sort->{$sort_key};
133
134	$sort_category_hash{$sortkey_val} =
135	$sort_key ne $rkeys_array->[$arr_size - 1] ? { } : [ ]
136	unless exists $sort_category_hash{$sortkey_val};
137
138	$rsort_category_array = $sort_category_hash{$sortkey_val};
139	}
140	else {
141
142	$rsort_category_array->{"sort"} = $rh_special_sort->{$sort_key};
143
144	# nest this reference in previous reference
145	$rsort_category_array->{$sortkey_val} =
146	$sort_key ne $rkeys_array->[$arr_size - 1] ? { } : [ ]
147	unless exists $rsort_category_array->{$sortkey_val};
148
149	$rsort_category_array = $rsort_category_array->{$sortkey_val};
150	}
151	}
152
153	# put the record key on full nested reference
154	push @{$rsort_category_array}, $rrecords_hash->{$rrecord_key};
155	}
156
157	# ==================
158	# Sort Nested Hash
159	# ==================
160	$depth = @{$rkeys_array};
161	$rresults_array =
162	sort_nested_hash(\%sort_category_hash, $depth);
163
164	return $rresults_array;
165	}
166
167
168	sub sort_nested_hash {
169	my ($rsort_category_hash, $depth) = @_;
170
171	# Recurses to $depth, sorting hash %{$rsort_category_hash} keys at every
172	# level. Pushes values at final levels onto @sort_results, which ends
173	# up holding all values in correct compound sort order.
174
175	my ($sorted_key, @sorted_keys_array, @sort_results, $rresults_array,
176	$hash_ref, $sort_sub);
177
178	#===============================
179	# check if we're done recursing
180	#===============================
181	if ($depth == 0) {
182	# return array of record_keys for this compound sort category
183	# (remember, rsort_category_hash now points to an anonymous array
184	# of anonymous hashes at the final nested hash key)
185	return $rsort_category_hash;
186	}
187
188	#==========================================
189	# otherwise, sort the keys at this depth
190	# and call self to sort keys at next depth
191	#==========================================
192	if ( $rsort_category_hash->{sort} ) {
193	$sort_sub = $rsort_category_hash->{sort};
194	delete $rsort_category_hash->{sort}; # otherwise it will be in the output
195
196	@sorted_keys_array = sort $sort_sub keys %{$rsort_category_hash};
197	}
198	else {
199	delete $rsort_category_hash->{sort}; # delete dummy sort key
200	@sorted_keys_array = sort keys %{$rsort_category_hash};
201	}
202
203
204	foreach $sorted_key (@sorted_keys_array) {
205
206	# "append" $sorted_key to hash ref passed in and call self
207	$rresults_array = sort_nested_hash($rsort_category_hash->{$sorted_key},
208	$depth - 1);
209
210	push @sort_results, @{$rresults_array};
211	}
212
213	return \@sort_results;
214	}
215
216	# hash_compare(): compares fields in record 1 with fields in record 2. Allows
217	# Oracle '%' wildcard at end of expression, ignores case.
218	sub hash_compare {
219
220	my ($rh_hash1, $rh_hash2) = @_;
221	my ($field_name, $hash2_field_re);
222
223	# if we look at each hash as a record in a table, where the keys
224	# are the field names and the values the field values, then we
225	# compare if the same field names have the same values. We take
226	# hash2 to be a subset of hash 1. If not (i.e. if hash2 has a
227	# field that isn't in hash1) then the hashes don't match. If all
228	# values for fields in hash2 match the values for the same fields
229	# in hash1 then the hashes match. We allow a "%" wildcard at the
230	# end of a string. "xyz%" matches /^(xyz)(.*)$/ (like
231	# the Oracle "like 'xyz%'", but only at the end of a string).
232
233	foreach $field_name (keys %{$rh_hash2} ) {
234
235	$hash2_field_re = $rh_hash2->{$field_name};
236
237	$hash2_field_re =~ s/^(.)%$/$1\(\.\\)/;
238
239	if ( ! exists $rh_hash1->{$field_name} \|\|
240	$rh_hash1->{$field_name} !~ /^$hash2_field_re$/i ) {
241
242	return 0; # "record" doesn't match - return false
243	}
244	}
245
246	# fall-through means all fields in hash1 matched, so "record" matches
247	# return true
248	return 1;
249	}
250
251
252	sub output_delimited {
253	my ($fh_out, $ra_records, $ra_field_order, $rh_field_titles, $delim,
254	$no_titles) = @_;
255
256	my ($rh_record, $field_name, $save_ors);
257
258	if (!$delim ) { $delim = "\\|" } # "\|" is default
259
260	fix_nulls($ra_records); # clean up data
261
262	# check Output Record Separator
263	if ( defined($\) ) {
264	$save_ors = $\;
265	$\ = ""; # disable for field-by-field print below
266	}
267
268	# output delimited field titles
269	if ( !$no_titles or uc($no_titles) eq "N" ) {
270	foreach $field_name (@{$ra_field_order} ) {
271	# print $field_name for field title if no $rh_field_titles
272	print $fh_out $rh_field_titles ? $rh_field_titles->{$field_name}
273	: $field_name;
274
275	# don't print delimiter if on last field
276	print $fh_out $delim unless $field_name eq
277	$ra_field_order->[ @{$ra_field_order} - 1 ];
278	}
279
280	if ( defined($save_ors) ) {
281	print $fh_out $save_ors;
282	}
283	else {
284	print $fh_out "\n";
285	}
286	}
287
288	OUTPUT_LOOP:
289	foreach $rh_record (@{$ra_records} ) {
290
291	next OUTPUT_LOOP unless defined( %{$rh_record} );
292
293	# fall-through
294
295	# output delimited field values
296	foreach $field_name (@{$ra_field_order} ) {
297	# allow the possibility that records may not have all the fields
298	if ( exists $rh_record->{$field_name} ) {
299	print $fh_out $rh_record->{$field_name};
300	}
301
302	# don't print delimiter if on last field
303	print $fh_out $delim unless $field_name eq
304	$ra_field_order->[ @{$ra_field_order} - 1 ];
305	}
306
307	if ( defined($save_ors) ) {
308	$\ = $save_ors; # restore saved value to $\
309	print $fh_out ""; # this will print the Output Record Separator
310	}
311	else {
312	print $fh_out "\n";
313	}
314	}
315	}
316
317
318	sub date_stamp {
319	my @ts = localtime;
320	my $timestamp = sprintf "%d/%d/%d %.2d:%.2d",
321	$ts[4] + 1,
322	$ts[3],
323	1900 + $ts[5],
324	$ts[2],
325	$ts[1];
326	return $timestamp;
327	}
328
329
330	sub date_stamp_mrep {
331
332	my %months = ( 1 => "JAN",
333	2 => "FEB",
334	3 => "MAR",
335	4 => "APR",
336	5 => "MAY",
337	6 => "JUN",
338	7 => "JUL",
339	8 => "AUG",
340	9 => "SEP",
341	10 => "OCT",
342	11 => "NOV",
343	12 => "DEC" );
344
345	my @ts = localtime;
346	my $timestamp = sprintf "%.2d-%s-%.2d %.2d:%.2d:%.2d",
347	$ts[3],
348	$months{ $ts[4] + 1 },
349	substr(1900 + $ts[5], 2, 2),
350	$ts[2],
351	$ts[1],
352	$ts[0];
353	return $timestamp;
354	}
355
356
357	sub arr2hash {
358	my $array_ref = shift;
359
360	my ($value, %hash, $i);
361
362	$i = 0;
363	foreach $value ( @{$array_ref} ) { $hash{$i++} = $value }
364	return \%hash;
365	}
366
367
368	sub date_compare {
369	my ($date, $op, $refdate) = @_;
370
371	my ($mm_date, $dd_date, $yyyy_date) = split(/\//, $date);
372	my ($mm_ref, $dd_ref, $yyyy_ref) = split(/\//, $refdate);
373
374	my $date_str = $yyyy_date . $mm_date . $dd_date;
375	my $ref_str = $yyyy_ref . $mm_ref . $dd_ref;
376
377	$compartment->reval( qq{
378	($date_str $op $ref_str) \|\| return 0;
379
380	# fall-through
381	return 1;
382	} );
383	}
384
385
386	# Note: You don't have to pass $rh_field_map, and if passed, it doesn't need
387	# values for every field. This sub will translate the fieldnames passed in
388	# $rh_field_map (if any) and leave the rest unchanged.
389	sub add2hash {
390
391	my ($rh_hash1, $rh_hash2, $rh_field_map) = @_;
392
393	my ($new_key, $mapped_key);
394
395	foreach $new_key ( keys %{$rh_hash2} ) {
396
397	if ( defined($rh_field_map) and
398	exists($rh_field_map->{$new_key} ) ) {
399	$mapped_key = $rh_field_map->{$new_key};
400	}
401	else { $mapped_key = $new_key }
402
403	if (!exists($rh_hash1->{$mapped_key} ) ) { # if name conflict, hash1 wins
404	$rh_hash1->{$mapped_key} = $rh_hash2->{$new_key};
405	}
406	}
407	}
408
409
410	sub fix_nulls {
411
412	my $ra_hashes = shift;
413
414	my ($rh_hash, $field);
415
416	FIX_LOOP:
417	for $rh_hash ( @{ $ra_hashes } ) {
418
419	next FIX_LOOP unless defined( %{$rh_hash} );
420
421	# fall-through
422
423	for $field ( keys %{ $rh_hash } ) {
424
425	if ( !defined($rh_hash->{$field} ) ) {
426	$rh_hash->{$field} = "";
427	}
428
429	}
430	}
431	}
432
433
434	sub ssn_format {
435	my $str = shift;
436
437	length($str) < 6 && return $str;
438
439	# fall-through
440	return substr($str, 0, 3) . "-" . substr($str, 3, 2) . "-" . substr($str, 5);
441	}
442
443
444	# Has optional final parm "outer_join". If outer_join is 'Y' then will return
445	# rows from sub1 even if no corresponding rows from sub2.
446	sub join_table_subs {
447	my ($rs_sub1, $ra_parms1, $rs_sub2, $ra_parms2, $outer_join) = @_;
448
449	my (@new_table, $ra_sub1, $rh_sub1, $ra_sub2, $rh_sub2, @subst_parms, $parm,
450	$subst_parm, $rh_new, $got_join_rows);
451
452	$ra_sub1 = &{ $rs_sub1 } ( @{ $ra_parms1 } );
453
454
455	foreach $rh_sub1 ( @{ $ra_sub1 } ) {
456
457	while (shift @subst_parms) { } # reset
458
459	# substitute $rh_sub1 values for relational parms (identified by "$" prefix)
460	foreach $parm ( @{$ra_parms2} ) {
461	$subst_parm = $parm;
462
463	if ( $subst_parm =~ /^\$/ ) {
464	$subst_parm =~ s/^\$//;
465
466	$subst_parm = $rh_sub1->{$subst_parm};
467	}
468
469	push @subst_parms, $subst_parm;
470	}
471
472	$ra_sub2 = &{ $rs_sub2 } ( @subst_parms );
473
474	$got_join_rows = 0;
475	foreach $rh_sub2 ( @{ $ra_sub2 } ) {
476
477	$got_join_rows = 1;
478	$rh_new = { }; # get new memory
479	add2hash($rh_new, $rh_sub1); # "dup" $rh_sub1
480
481	add2hash($rh_new, $rh_sub2);
482	push @new_table, $rh_new;
483	}
484
485	if ( defined($outer_join) and
486	$outer_join eq 'Y' and
487	!$got_join_rows ) {
488
489	$rh_new = { }; # get new memory
490	add2hash($rh_new, $rh_sub1); # "dup" $rh_sub1
491
492	push @new_table, $rh_new;
493	}
494	}
495
496	return \@new_table;
497	}
498
499
500	sub is_true {
501
502	my $comparison_str = shift;
503
504	$compartment->reval( qq{
505	if ($comparison_str) { return 1 }
506
507	# fall-through
508	return 0;
509	} );
510	}
511
512
513	# draw_from_hat() - single arg is ref to array of scalar identifiers
514	sub draw_from_hat {
515
516	my $ra_population = shift;
517
518	my ($identifier, %rand_population, $cnt, $rand_no, @sorted_keys,
519	@save_sorted_keys, $rand_key, $pop_size, $size);
520
521	$pop_size = @{$ra_population};
522
523
524	# put each identifier into %rand_population under a random key
525	foreach $identifier (@$ra_population) {
526
527	$rand_no = rand;
528	while ( exists $rand_population{$rand_no} ) {
529	$rand_no = rand;
530	}
531
532	$rand_population{$rand_no} = $identifier;
533	}
534
535
536	# pick the random number of times to iterate
537	$rand_no = 0;
538
539	while ( $rand_no <= 0 ) {
540	$rand_no = rand;
541	}
542
543	$rand_no = ($pop_size 5); # go through population up to 5 times just
544	# so we don't have any bias for or against
545	# those at the beginning or end of the
546	# population (note: rand returns decimals
547	# between 0 and 1)
548
549	$rand_no = sprintf("%d", $rand_no + 1); # make sure the integer part is > 0
550	# so that we get at least 1 iteration
551
552
553	# sort by random keys and iterate a random number of times to pick the winner
554
555	@sorted_keys = (sort keys %rand_population);
556	@save_sorted_keys = @sorted_keys;
557
558	$cnt = 0;
559
560	while ( $cnt != $rand_no ) {
561
562	$cnt++;
563
564	$size = @sorted_keys;
565
566	( $size ) \|\| ( @sorted_keys = @save_sorted_keys );
567
568	$rand_key = shift @sorted_keys;
569
570	}
571
572
573	return $rand_population{$rand_key};
574
575	}
576
577
578	sub num_sort {
579	$a <=> $b;
580	}
581
582	sub date_sort {
583	date_compare($a, "<", $b) && return -1;
584	date_compare($a, "==", $b) && return 0;
585	date_compare($a, ">", $b) && return 1;
586	}
587
588
589	sub add_commas2dollars {
590
591	my $amount = shift;
592
593	my ($dollars, $cents);
594
595	($dollars, $cents) = split(/\./, $amount);
596
597	if ( !defined($cents) ) { $cents = 0 };
598
599	return add_commas($dollars) . '.' . substr(sprintf("%.2d", $cents), 0, 2);
600	}
601
602
603	sub add_commas {
604
605	my $integer = shift;
606
607	my ($digit, $pos, @digits, $char, $cnt, $integer_w_commas);
608
609	$cnt = 0;
610	# grab each digit starting w/ the last
611	for ( $pos = length($integer) - 1; $pos >= 0; $pos-- ) {
612
613	$cnt++;
614
615	$digit = substr($integer, $pos, 1);
616	push @digits, $digit;
617
618	if ( $cnt % 3 == 0 ) {
619	push @digits, ',';
620	}
621	}
622
623	while ( defined($char = pop @digits) ) {
624	$integer_w_commas .= $char;
625	}
626
627	$integer_w_commas =~ s/^,//; # in case $cnt ended on a multiple of 3
628
629	return $integer_w_commas;
630	}
631
632
633	sub delta_time {
634
635	my $delta_hrs = shift;
636
637	defined($delta_hrs) && $delta_hrs =~ /^[-+]*\d+/
638	or die "ERROR: bad param $delta_hrs";
639
640	my (@ts);
641
642	@ts = localtime( time() + ($delta_hrs * 3600) );
643
644	# fall-through
645	my $timestamp = sprintf "%.2d/%.2d/%d %.2d:%.2d",
646	$ts[4] + 1,
647	$ts[3],
648	1900 + $ts[5],
649	$ts[2],
650	$ts[1];
651
652	return $timestamp;
653	}
654
655
656	return 1; # for module
657
658