package Spreadsheet::WriteExcel::Utility; ############################################################################### # # Utility - Helper functions for Spreadsheet::WriteExcel. # # Copyright 2000-2010, John McNamara, jmcnamara@cpan.org # # use Exporter; use strict; use autouse 'Date::Calc' => qw(Delta_DHMS Decode_Date_EU Decode_Date_US); use autouse 'Date::Manip' => qw(ParseDate Date_Init); # Do all of the export preparation use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS); # Row and column functions my @rowcol = qw( xl_rowcol_to_cell xl_cell_to_rowcol xl_range_formula xl_inc_row xl_dec_row xl_inc_col xl_dec_col ); # Date and Time functions my @dates = qw( xl_date_list xl_date_1904 xl_parse_time xl_parse_date xl_parse_date_init xl_decode_date_EU xl_decode_date_US ); @ISA = qw(Exporter); @EXPORT_OK = (); @EXPORT = (@rowcol, @dates); %EXPORT_TAGS = ( rowcol => \@rowcol, dates => \@dates ); $VERSION = '2.40'; =encoding latin1 =head1 NAME Utility - Helper functions for Spreadsheet::WriteExcel. =head1 SYNOPSIS Functions to help with some common tasks when using Spreadsheet::WriteExcel. These functions mainly relate to dealing with rows and columns in A1 notation and to handling dates and times. use Spreadsheet::WriteExcel::Utility; # Import everything ($row, $col) = xl_cell_to_rowcol('C2'); # (1, 2) $str = xl_rowcol_to_cell(1, 2); # C2 $str = xl_inc_col('Z1' ); # AA1 $str = xl_dec_col('AA1' ); # Z1 $date = xl_date_list(2002, 1, 1); # 37257 $date = xl_parse_date("11 July 1997"); # 35622 $time = xl_parse_time('3:21:36 PM'); # 0.64 $date = xl_decode_date_EU("13 May 2002"); # 37389 =head1 DESCRIPTION This module provides a set of functions to help with some common tasks encountered when using the Spreadsheet::WriteExcel module. The two main categories of function are: Row and column functions: these are used to deal with Excel's A1 representation of cells. The functions in this category are: xl_rowcol_to_cell xl_cell_to_rowcol xl_range_formula xl_inc_row xl_dec_row xl_inc_col xl_dec_col Date and Time functions: these are used to convert dates and times to the numeric format used by Excel. The functions in this category are: xl_date_list xl_date_1904 xl_parse_time xl_parse_date xl_parse_date_init xl_decode_date_EU xl_decode_date_US All of these functions are exported by default. However, you can use import lists if you wish to limit the functions that are imported: use Spreadsheet::WriteExcel::Utility; # Import everything use Spreadsheet::WriteExcel::Utility qw(xl_date_list); # xl_date_list only use Spreadsheet::WriteExcel::Utility qw(:rowcol); # Row/col functions use Spreadsheet::WriteExcel::Utility qw(:dates); # Date functions =head1 ROW AND COLUMN FUNCTIONS Spreadsheet::WriteExcel supports two forms of notation to designate the position of cells: Row-column notation and A1 notation. Row-column notation uses a zero based index for both row and column while A1 notation uses the standard Excel alphanumeric sequence of column letter and 1-based row. Columns range from A to IV i.e. 0 to 255, rows range from 1 to 16384 in Excel 5 and 65536 in Excel 97. For example: (0, 0) # The top left cell in row-column notation. ('A1') # The top left cell in A1 notation. (1999, 29) # Row-column notation. ('AD2000') # The same cell in A1 notation. Row-column notation is useful if you are referring to cells programmatically: for my $i (0 .. 9) { $worksheet->write($i, 0, 'Hello'); # Cells A1 to A10 } A1 notation is useful for setting up a worksheet manually and for working with formulas: $worksheet->write('H1', 200); $worksheet->write('H2', '=H7+1'); The functions in the following sections can be used for dealing with A1 notation, for example: ($row, $col) = xl_cell_to_rowcol('C2'); # (1, 2) $str = xl_rowcol_to_cell(1, 2); # C2 Cell references in Excel can be either relative or absolute. Absolute references are prefixed by the dollar symbol as shown below: A1 # Column and row are relative $A1 # Column is absolute and row is relative A$1 # Column is relative and row is absolute $A$1 # Column and row are absolute An absolute reference only has an effect if the cell is copied. Refer to the Excel documentation for further details. All of the following functions support absolute references. =cut ############################################################################### ############################################################################### =head2 xl_rowcol_to_cell($row, $col, $row_absolute, $col_absolute) Parameters: $row: Integer $col: Integer $row_absolute: Boolean (1/0) [optional, default is 0] $col_absolute: Boolean (1/0) [optional, default is 0] Returns: A string in A1 cell notation This function converts a zero based row and column cell reference to a A1 style string: $str = xl_rowcol_to_cell(0, 0); # A1 $str = xl_rowcol_to_cell(0, 1); # B1 $str = xl_rowcol_to_cell(1, 0); # A2 The optional parameters C<$row_absolute> and C<$col_absolute> can be used to indicate if the row or column is absolute: $str = xl_rowcol_to_cell(0, 0, 0, 1); # $A1 $str = xl_rowcol_to_cell(0, 0, 1, 0); # A$1 $str = xl_rowcol_to_cell(0, 0, 1, 1); # $A$1 See L for an explanation of absolute cell references. =cut ############################################################################### # # xl_rowcol_to_cell($row, $col, $row_absolute, $col_absolute) # sub xl_rowcol_to_cell { my $row = $_[0]; my $col = $_[1]; my $row_abs = $_[2] ? '$' : ''; my $col_abs = $_[3] ? '$' : ''; my $col_str = ''; # Change from 0-indexed to 1 indexed. $row++; $col++; while ( $col ) { # Set remainder from 1 .. 26 my $remainder = $col % 26 || 26; # Convert the $remainder to a character. C-ishly. my $col_letter = chr( ord( 'A' ) + $remainder - 1 ); # Accumulate the column letters, right to left. $col_str = $col_letter . $col_str; # Get the next order of magnitude. $col = int( ( $col - 1 ) / 26 ); } return $col_abs . $col_str . $row_abs . $row; } ############################################################################### ############################################################################### =head2 xl_cell_to_rowcol($string) Parameters: $string String in A1 format Returns: List ($row, $col) This function converts an Excel cell reference in A1 notation to a zero based row and column. The function will also handle Excel's absolute, C<$>, cell notation. my ($row, $col) = xl_cell_to_rowcol('A1'); # (0, 0) my ($row, $col) = xl_cell_to_rowcol('B1'); # (0, 1) my ($row, $col) = xl_cell_to_rowcol('C2'); # (1, 2) my ($row, $col) = xl_cell_to_rowcol('$C2' ); # (1, 2) my ($row, $col) = xl_cell_to_rowcol('C$2' ); # (1, 2) my ($row, $col) = xl_cell_to_rowcol('$C$2'); # (1, 2) =cut ############################################################################### # # xl_cell_to_rowcol($string) # # Returns: ($row, $col, $row_absolute, $col_absolute) # # The $row_absolute and $col_absolute parameters aren't documented because they # mainly used internally and aren't very useful to the user. # sub xl_cell_to_rowcol { my $cell = shift; $cell =~ /(\$?)([A-Z]{1,3})(\$?)(\d+)/; my $col_abs = $1 eq "" ? 0 : 1; my $col = $2; my $row_abs = $3 eq "" ? 0 : 1; my $row = $4; # Convert base26 column string to number # All your Base are belong to us. my @chars = split //, $col; my $expn = 0; $col = 0; while (@chars) { my $char = pop(@chars); # LS char first $col += (ord($char) -ord('A') +1) * (26**$expn); $expn++; } # Convert 1-index to zero-index $row--; $col--; return $row, $col, $row_abs, $col_abs; } ############################################################################### ############################################################################### =head2 xl_range_formula($sheetname, $row_1, $row_2, $col_1, $col_2) Parameters: $sheetname String $row_1: Integer $row_2: Integer $col_1: Integer $col_2: Integer Returns: A worksheet range formula as a string. This function converts zero based row and column cell references to an A1 style formula string: my $str = xl_range_formula('Sheet1', 0, 9, 0, 0); # =Sheet1!$A$1:$A$10 my $str = xl_range_formula('Sheet2', 6, 65, 1, 1); # =Sheet2!$B$7:$B$66 my $str = xl_range_formula('New data', 1, 8, 2, 2); # ='New data'!$C$2:$C$9 This is useful for setting ranges in Chart objects: $chart->add_series( categories => xl_range_formula('Sheet1', 1, 9, 0, 0), values => xl_range_formula('Sheet1', 1, 9, 1, 1), ); # Which is the same as: $chart->add_series( categories => '=Sheet1!$A$2:$A$10', values => '=Sheet1!$B$2:$B$10', ); =cut ############################################################################### # # xl_range_formula($sheetname, $row_1, $row_2, $col_1, $col_2) # sub xl_range_formula { my ($sheetname, $row_1, $row_2, $col_1, $col_2) = @_; # Use Excel's conventions and quote the sheet name if it contains any # non-word character or if it isn't already quoted. if ($sheetname =~ /\W/ && $sheetname !~ /^'/) { $sheetname = q(') . $sheetname . q('); } my $range1 = xl_rowcol_to_cell($row_1, $col_1, 1, 1); my $range2 = xl_rowcol_to_cell($row_2, $col_2, 1, 1); return '=' . $sheetname . '!' . $range1 . ':' . $range2; } ############################################################################### ############################################################################### =head2 xl_inc_row($string) Parameters: $string, a string in A1 format Returns: Incremented string in A1 format This functions takes a cell reference string in A1 notation and increments the row. The function will also handle Excel's absolute, C<$>, cell notation: my $str = xl_inc_row('A1' ); # A2 my $str = xl_inc_row('B$2' ); # B$3 my $str = xl_inc_row('$C3' ); # $C4 my $str = xl_inc_row('$D$4'); # $D$5 =cut ############################################################################### # # xl_inc_row($string) # sub xl_inc_row { my $cell = shift; my ($row, $col, $row_abs, $col_abs) = xl_cell_to_rowcol($cell); return xl_rowcol_to_cell(++$row, $col, $row_abs, $col_abs); } ############################################################################### ############################################################################### =head2 xl_dec_row($string) Parameters: $string, a string in A1 format Returns: Decremented string in A1 format This functions takes a cell reference string in A1 notation and decrements the row. The function will also handle Excel's absolute, C<$>, cell notation: my $str = xl_dec_row('A2' ); # A1 my $str = xl_dec_row('B$3' ); # B$2 my $str = xl_dec_row('$C4' ); # $C3 my $str = xl_dec_row('$D$5'); # $D$4 =cut ############################################################################### # # xl_dec_row($string) # # Decrements the row number of an Excel cell reference in A1 notation. # For example C4 to C3 # # Returns: a cell reference string. # sub xl_dec_row { my $cell = shift; my ($row, $col, $row_abs, $col_abs) = xl_cell_to_rowcol($cell); return xl_rowcol_to_cell(--$row, $col, $row_abs, $col_abs); } ############################################################################### ############################################################################### =head2 xl_inc_col($string) Parameters: $string, a string in A1 format Returns: Incremented string in A1 format This functions takes a cell reference string in A1 notation and increments the column. The function will also handle Excel's absolute, C<$>, cell notation: my $str = xl_inc_col('A1' ); # B1 my $str = xl_inc_col('Z1' ); # AA1 my $str = xl_inc_col('$B1' ); # $C1 my $str = xl_inc_col('$D$5'); # $E$5 =cut ############################################################################### # # xl_inc_col($string) # # Increments the column number of an Excel cell reference in A1 notation. # For example C3 to D3 # # Returns: a cell reference string. # sub xl_inc_col { my $cell = shift; my ($row, $col, $row_abs, $col_abs) = xl_cell_to_rowcol($cell); return xl_rowcol_to_cell($row, ++$col, $row_abs, $col_abs); } ############################################################################### ############################################################################### =head2 xl_dec_col($string) Parameters: $string, a string in A1 format Returns: Decremented string in A1 format This functions takes a cell reference string in A1 notation and decrements the column. The function will also handle Excel's absolute, C<$>, cell notation: my $str = xl_dec_col('B1' ); # A1 my $str = xl_dec_col('AA1' ); # Z1 my $str = xl_dec_col('$C1' ); # $B1 my $str = xl_dec_col('$E$5'); # $D$5 =cut ############################################################################### # # xl_dec_col($string) # sub xl_dec_col { my $cell = shift; my ($row, $col, $row_abs, $col_abs) = xl_cell_to_rowcol($cell); return xl_rowcol_to_cell($row, --$col, $row_abs, $col_abs); } =head1 TIME AND DATE FUNCTIONS Dates and times in Excel are represented by real numbers, for example "Jan 1 2001 12:30 AM" is represented by the number 36892.521. The integer part of the number stores the number of days since the epoch and the fractional part stores the percentage of the day in seconds. The epoch can be either 1900 or 1904. Excel for Windows uses 1900 and Excel for Macintosh uses 1904. The epochs are: 1900: 0 January 1900 i.e. 31 December 1899 1904: 1 January 1904 Excel on Windows and the Macintosh will convert automatically between one system and the other. By default Spreadsheet::WriteExcel uses the 1900 format. To use the 1904 epoch you must use the C workbook method, see the Spreadsheet::WriteExcel documentation. There are two things to note about the 1900 date format. The first is that the epoch starts on 0 January 1900. The second is that the year 1900 is erroneously but deliberately treated as a leap year. Therefore you must add an extra day to dates after 28 February 1900. The functions in the following section will deal with these issues automatically. The reason for this anomaly is explained at http://support.microsoft.com/support/kb/articles/Q181/3/70.asp Note, a date or time in Excel is like any other number. To display the number as a date you must apply a number format to it: Refer to the C method in the Spreadsheet::WriteExcel documentation: $date = xl_date_list(2001, 1, 1, 12, 30); $format->set_num_format('mmm d yyyy hh:mm AM/PM'); $worksheet->write('A1', $date , $format); # Jan 1 2001 12:30 AM To use these functions you must install the C and C modules. See L and the individual requirements of each functions. See also the DateTime::Format::Excel module,http://search.cpan.org/search?dist=DateTime-Format-Excel which is part of the DateTime project and which deals specifically with converting dates and times to and from Excel's format. =cut ############################################################################### ############################################################################### =head2 xl_date_list($years, $months, $days, $hours, $minutes, $seconds) Parameters: $years: Integer $months: Integer [optional, default is 1] $days: Integer [optional, default is 1] $hours: Integer [optional, default is 0] $minutes: Integer [optional, default is 0] $seconds: Float [optional, default is 0] Returns: A number that represents an Excel date or undef for an invalid date. Requires: Date::Calc This function converts an array of data into a number that represents an Excel date. All of the parameters are optional except for C<$years>. $date1 = xl_date_list(2002, 1, 2); # 2 Jan 2002 $date2 = xl_date_list(2002, 1, 2, 12); # 2 Jan 2002 12:00 pm $date3 = xl_date_list(2002, 1, 2, 12, 30); # 2 Jan 2002 12:30 pm $date4 = xl_date_list(2002, 1, 2, 12, 30, 45); # 2 Jan 2002 12:30:45 pm This function can be used in conjunction with functions that parse date and time strings. In fact it is used in most of the following functions. =cut ############################################################################### # # xl_date_list($years, $months, $days, $hours, $minutes, $seconds) # sub xl_date_list { return undef unless @_; my $years = $_[0]; my $months = $_[1] || 1; my $days = $_[2] || 1; my $hours = $_[3] || 0; my $minutes = $_[4] || 0; my $seconds = $_[5] || 0; my @date = ($years, $months, $days, $hours, $minutes, $seconds); my @epoch = (1899, 12, 31, 0, 0, 0); ($days, $hours, $minutes, $seconds) = Delta_DHMS(@epoch, @date); my $date = $days + ($hours*3600 +$minutes*60 +$seconds)/(24*60*60); # Add a day for Excel's missing leap day in 1900 $date++ if ($date > 59); return $date; } ############################################################################### ############################################################################### =head2 xl_parse_time($string) Parameters: $string, a textual representation of a time Returns: A number that represents an Excel time or undef for an invalid time. This function converts a time string into a number that represents an Excel time. The following time formats are valid: hh:mm [AM|PM] hh:mm [AM|PM] hh:mm:ss [AM|PM] hh:mm:ss.ss [AM|PM] The meridian, AM or PM, is optional and case insensitive. A 24 hour time is assumed if the meridian is omitted $time1 = xl_parse_time('12:18'); $time2 = xl_parse_time('12:18:14'); $time3 = xl_parse_time('12:18:14 AM'); $time4 = xl_parse_time('1:18:14 AM'); Time in Excel is expressed as a fraction of the day in seconds. Therefore you can calculate an Excel time as follows: $time = ($hours*3600 +$minutes*60 +$seconds)/(24*60*60); =cut ############################################################################### # # xl_parse_time($string) # sub xl_parse_time { my $time = shift; if ($time =~ /(\d{1,2}):(\d\d):?((?:\d\d)(?:\.\d+)?)?(?:\s+)?(am|pm)?/i) { my $hours = $1; my $minutes = $2; my $seconds = $3 || 0; my $meridian = lc($4) || ''; # Normalise midnight and midday $hours = 0 if ($hours == 12 && $meridian ne ''); # Add 12 hours to the pm times. Note: 12.00 pm has been set to 0.00. $hours += 12 if $meridian eq 'pm'; # Calculate the time as a fraction of 24 hours in seconds return ($hours*3600 +$minutes*60 +$seconds)/(24*60*60); } else { return undef; # Not a valid time string } } ############################################################################### ############################################################################### =head2 xl_parse_date($string) Parameters: $string, a textual representation of a date and time Returns: A number that represents an Excel date or undef for an invalid date. Requires: Date::Manip and Date::Calc This function converts a date and time string into a number that represents an Excel date. The parsing is performed using the C function of the Date::Manip module. Refer to the Date::Manip documentation for further information about the date and time formats that can be parsed. In order to use this function you will probably have to initialise some Date::Manip variables via the C function, see below. xl_parse_date_init("TZ=GMT","DateFormat=non-US"); $date1 = xl_parse_date("11/7/97"); $date2 = xl_parse_date("Friday 11 July 1997"); $date3 = xl_parse_date("10:30 AM Friday 11 July 1997"); $date4 = xl_parse_date("Today"); $date5 = xl_parse_date("Yesterday"); Note, if you parse a string that represents a time but not a date this function will add the current date. If you want the time without the date you can do something like the following: $time = xl_parse_date("10:30 AM"); $time -= int($time); =cut ############################################################################### # # xl_parse_date($string) # sub xl_parse_date { my $date = ParseDate($_[0]); return undef unless defined $date; # Unpack the return value from ParseDate() my ($years, $months, $days, $hours, undef, $minutes, undef, $seconds) = unpack("A4 A2 A2 A2 C A2 C A2", $date); # Convert to Excel date return xl_date_list($years, $months, $days, $hours, $minutes, $seconds); } ############################################################################### ############################################################################### =head2 xl_parse_date_init("variable=value", ...) Parameters: A list of Date::Manip variable strings Returns: A list of all the Date::Manip strings Requires: Date::Manip This function is used to initialise variables required by the Date::Manip module. You should call this function before calling C. It need only be called once. This function is a thin wrapper for the C function. You can use C directly if you wish. Refer to the Date::Manip documentation for further information. xl_parse_date_init("TZ=MST","DateFormat=US"); $date1 = xl_parse_date("11/7/97"); # November 7th 1997 xl_parse_date_init("TZ=GMT","DateFormat=non-US"); $date1 = xl_parse_date("11/7/97"); # July 11th 1997 =cut ############################################################################### # # xl_parse_date_init("variable=value", ...) # sub xl_parse_date_init { Date_Init(@_); # How lazy is that. } ############################################################################### ############################################################################### =head2 xl_decode_date_EU($string) Parameters: $string, a textual representation of a date and time Returns: A number that represents an Excel date or undef for an invalid date. Requires: Date::Calc This function converts a date and time string into a number that represents an Excel date. The date parsing is performed using the C function of the Date::Calc module. Refer to the Date::Calc for further information about the date formats that can be parsed. Also note the following from the Date::Calc documentation: "If the year is given as one or two digits only (i.e., if the year is less than 100), it is mapped to the window 1970 -2069 as follows": 0 E= $year E 70 ==> $year += 2000; 70 E= $year E 100 ==> $year += 1900; The time portion of the string is parsed using the C function described above. Note: the EU in the function name means that a European date format is assumed if it is not clear from the string. See the first example below. $date1 = xl_decode_date_EU("11/7/97"); #11 July 1997 $date2 = xl_decode_date_EU("Sat 12 Sept 1998"); $date3 = xl_decode_date_EU("4:30 AM Sat 12 Sept 1998"); =cut ############################################################################### # # xl_decode_date_EU($string) # sub xl_decode_date_EU { return undef unless @_; my $date = shift; my @date; my $time = 0; # Remove and decode the time portion of the string if ($date =~ s/(\d{1,2}:\d\d:?(\d\d(\.\d+)?)?(\s+)?(am|pm)?)//i) { $time = xl_parse_time($1); return undef unless defined $time; } # Return if the string is now blank, i.e. it contained a time only. return $time if $date =~ /^\s*$/; # Decode the date portion of the string @date = Decode_Date_EU($date); return undef unless @date; return xl_date_list(@date) + $time; } ############################################################################### ############################################################################### =head2 xl_decode_date_US($string) Parameters: $string, a textual representation of a date and time Returns: A number that represents an Excel date or undef for an invalid date. Requires: Date::Calc This function converts a date and time string into a number that represents an Excel date. The date parsing is performed using the C function of the Date::Calc module. Refer to the Date::Calc for further information about the date formats that can be parsed. Also note the following from the Date::Calc documentation: "If the year is given as one or two digits only (i.e., if the year is less than 100), it is mapped to the window 1970 -2069 as follows": 0 <= $year < 70 ==> $year += 2000; 70 <= $year < 100 ==> $year += 1900; The time portion of the string is parsed using the C function described above. Note: the US in the function name means that an American date format is assumed if it is not clear from the string. See the first example below. $date1 = xl_decode_date_US("11/7/97"); # 7 November 1997 $date2 = xl_decode_date_US("12 Sept Saturday 1998"); $date3 = xl_decode_date_US("4:30 AM 12 Sept Sat 1998"); =cut ############################################################################### # # xl_decode_date_US($string) # sub xl_decode_date_US { return undef unless @_; my $date = shift; my @date; my $time = 0; # Remove and decode the time portion of the string if ($date =~ s/(\d{1,2}:\d\d:?(\d\d(\.\d+)?)?(\s+)?(am|pm)?)//i) { $time = xl_parse_time($1); return undef unless defined $time; } # Return if the string is now blank, i.e. it contained a time only. return $time if $date =~ /^\s*$/; # Decode the date portion of the string @date = Decode_Date_US($date); return undef unless @date; return xl_date_list(@date) + $time; } ############################################################################### ############################################################################### =head2 xl_date_1904($date) Parameters: $date, an Excel date with a 1900 epoch Returns: an Excel date with a 1904 epoch or zero if the $date is before 1904 This function converts an Excel date based on the 1900 epoch into a date based on the 1904 epoch. $date1 = xl_date_list(2002, 1, 13); # 13 Jan 2002, 1900 epoch $date2 = xl_date_1904($date1); # 13 Jan 2002, 1904 epoch See also the C workbook method in the Spreadsheet::WriteExcel documentation. =cut ############################################################################### # # xl_decode_date_US($string) # sub xl_date_1904 { my $date = $_[0] || 0; if ($date < 1462) { # before 1904 $date = 0; } else { $date -= 1462; } return $date; } =head1 REQUIREMENTS The date and time functions require functions from the C and C modules. The required functions are "autoused" from these modules so that you do not have to install them unless you wish to use the date and time routines. Therefore it is possible to use the row and column functions without having C and C installed. For more information about "autousing" refer to the documentation on the C pragma. =head1 BUGS When using the autoused functions from C and C on Perl 5.6.0 with C<-w> you will get a warning like this: "Subroutine xxx redefined ..." The current workaround for this is to put C near the beginning of your program. =head1 AUTHOR John McNamara jmcnamara@cpan.org =head1 COPYRIGHT Copyright MM-MMX, John McNamara. All Rights Reserved. This module is free software. It may be used, redistributed and/or modified under the same terms as Perl itself. =cut 1; __END__