1
|
<?php
|
2
|
|
3
|
/**
|
4
|
* This exporter creates an XLSX file readable by newer versions of Excel.
|
5
|
*/
|
6
|
class webform_exporter_excel_xlsx extends webform_exporter {
|
7
|
/**
|
8
|
* Regular expression that checks for a valid ISO 8601 date/time.
|
9
|
*/
|
10
|
const DATE_REGEX_ANY = '/^((\d{4})(-(\d{2}))(-(\d{2})))?(([T \s]?(\d{2}))(:(\d{2}))(:(\d{2}))?)?$/';
|
11
|
const DATE_REGEX_DATE = '/^((\d{4})(-(\d{2}))(-(\d{2})))$/';
|
12
|
const DATE_REGEX_TIME = '/^(([T \s]?(\d{2}))(:(\d{2}))(:(\d{2}))?)?$/';
|
13
|
|
14
|
/**
|
15
|
* {@inheritdoc}
|
16
|
*/
|
17
|
public function add_row(&$file_handle, array $data, $row_count) {
|
18
|
$row = $row_count + 1;
|
19
|
$col = 'A';
|
20
|
|
21
|
$output = '<row>';
|
22
|
$utc_timezone = new DateTimeZone('UTC');
|
23
|
foreach ($data as $key => $value) {
|
24
|
// Strip UTF8 characters that are not legal in XML files.
|
25
|
// See http://www.w3.org/TR/xml/#charsets
|
26
|
// See http://stackoverflow.com/questions/3466035/how-to-skip-invalid-characters-in-xml-file-using-php
|
27
|
// @code
|
28
|
// Char ::= #x9 | #xA | #xD | [#x20-#xD7FF] | [#xE000-#xFFFD] | [#x10000-#x10FFFF]
|
29
|
// @endcode
|
30
|
$value = preg_replace('/[^\x{0009}\x{000a}\x{000d}\x{0020}-\x{D7FF}\x{E000}-\x{FFFD}]+/u', '', $value);
|
31
|
|
32
|
$cell_position = $col . $row;
|
33
|
if (strlen($value) === 0) {
|
34
|
// Skip empty cells.
|
35
|
}
|
36
|
elseif (preg_match(self::DATE_REGEX_ANY, $value)) {
|
37
|
// An Excel timestamp is the number of days since Jan 1, 1900, with
|
38
|
// the decimal portion indicating the time (ddddd.tttttt).
|
39
|
// To calculate, take the UNIX timestamp then add the number of days
|
40
|
// between 1900 and 1970 (25568).
|
41
|
$timestamp = date_timestamp_get(date_create($value, $utc_timezone));
|
42
|
$excel_timestamp = ($timestamp / 86400) + 25568;
|
43
|
|
44
|
// 1900 is treated as a leap year, but it is not. So all dates after
|
45
|
// Feb 28, 1900 have one extra day added. That is "59" should be
|
46
|
// March 1, 1900, but it's considered Feb 29, 1900, which didn't exist.
|
47
|
// So all dates greater than 59 have 1 extra day added.
|
48
|
// See http://www.cpearson.com/excel/datetime.htm.
|
49
|
if ($excel_timestamp >= 59) {
|
50
|
$excel_timestamp = $excel_timestamp + 1.0;
|
51
|
}
|
52
|
|
53
|
// Excel does not support dates prior to 0 (Jan 1, 1900). They have to
|
54
|
// be represented as plain-text instead.
|
55
|
if ($excel_timestamp <= 0) {
|
56
|
$output .= '<c r="' . $cell_position . '" t="inlineStr"><is><t>';
|
57
|
$output .= htmlspecialchars($value, ENT_QUOTES);
|
58
|
$output .= '</t></is></c>';
|
59
|
}
|
60
|
// Now after calculating the Excel "timestamp", save it as a decimal
|
61
|
// and point to a style formatter to make it appear as a date/time.
|
62
|
else {
|
63
|
// 1: Dates.
|
64
|
// 2: Times.
|
65
|
// 3: Date times.
|
66
|
// These are tied to style definitions in the styles.xml file
|
67
|
// generated by webform_exporter_excel_xlsx::xlsx_parts().
|
68
|
if (preg_match(self::DATE_REGEX_DATE, $value)) {
|
69
|
$style_format = 1;
|
70
|
}
|
71
|
elseif (preg_match(self::DATE_REGEX_TIME, $value)) {
|
72
|
// Only take the time portion of time values.
|
73
|
$excel_timestamp = $excel_timestamp - (int) $excel_timestamp;
|
74
|
$style_format = 2;
|
75
|
}
|
76
|
else {
|
77
|
$style_format = 3;
|
78
|
}
|
79
|
|
80
|
$output .= '<c r="' . $cell_position . '" s="' . $style_format . '"><v>';
|
81
|
$output .= $excel_timestamp;
|
82
|
$output .= '</v></c>';
|
83
|
}
|
84
|
}
|
85
|
else {
|
86
|
$output .= '<c r="' . $cell_position . '" t="inlineStr"' . ($this->wrappable($row_count, $key, $value) ? ' s="4"' : '') . '><is><t>';
|
87
|
$output .= htmlspecialchars($value, ENT_QUOTES, 'UTF-8');
|
88
|
$output .= '</t></is></c>';
|
89
|
}
|
90
|
|
91
|
// Unbelievably, in PHP you can increment on letters. "Z"++ becomes "AA"
|
92
|
// and "AA"++ becomes "AB", identical to Excel column names.
|
93
|
$col++;
|
94
|
}
|
95
|
$output .= '</row>';
|
96
|
$row++;
|
97
|
|
98
|
@fwrite($file_handle, $output);
|
99
|
}
|
100
|
|
101
|
/**
|
102
|
* Output space for the BOF.
|
103
|
*
|
104
|
* Our beginning of file needs to include unknown data (the number of columns
|
105
|
* and rows) at this point. Instead of writing the true BOF, we output enough
|
106
|
* empty space to fill in the BOF later. See
|
107
|
* webform_exporter_excel_xlsx::eof().
|
108
|
*/
|
109
|
public function bof(&$file_handle) {
|
110
|
$output = str_repeat(' ', 1024);
|
111
|
@fwrite($file_handle, $output . "\n");
|
112
|
}
|
113
|
|
114
|
/**
|
115
|
* Output the BOF and end the file.
|
116
|
*
|
117
|
* We output a chunk of empty data in webform_exporter_excel_xlsx::bof() to
|
118
|
* leave room for our real header, which includes the important <dimension>
|
119
|
* tag. This is required for proper importing into Google Docs.
|
120
|
*/
|
121
|
public function eof(&$file_handle, $row_count, $col_count) {
|
122
|
// Convert column count to letter representation.
|
123
|
$col = 'A';
|
124
|
for ($n = 1; $n < $col_count; $n++) {
|
125
|
$col++;
|
126
|
}
|
127
|
|
128
|
$bof = '';
|
129
|
$bof .= '<?xml version="1.0" encoding="UTF-8" standalone="yes"?>' . "\n";
|
130
|
$bof .= '<worksheet xmlns="http://schemas.openxmlformats.org/spreadsheetml/2006/main">';
|
131
|
$bof .= '<dimension ref="A1:' . $col . $row_count . '"/>';
|
132
|
$bof .= '<sheetData>';
|
133
|
|
134
|
@fseek($file_handle, 0);
|
135
|
@fwrite($file_handle, $bof);
|
136
|
|
137
|
$eof = '';
|
138
|
$eof .= '</sheetData>';
|
139
|
$eof .= '</worksheet>';
|
140
|
|
141
|
fseek($file_handle, 0, SEEK_END);
|
142
|
fwrite($file_handle, $eof);
|
143
|
}
|
144
|
|
145
|
/**
|
146
|
* {@inheritdoc}
|
147
|
*/
|
148
|
public function post_process(&$results) {
|
149
|
// Our download file is currently a single XML sheet file. We need to add
|
150
|
// the peripheral XML files to make this into a XLSX directory, then zip it.
|
151
|
$file_uri = $results['file_name'];
|
152
|
$zip_uri = _webform_export_tempname();
|
153
|
|
154
|
// ZipArchive does not support stream wrappers, convert to filesystem path.
|
155
|
$zip_filepath = drupal_realpath($zip_uri);
|
156
|
$file_filepath = drupal_realpath($file_uri);
|
157
|
$zip = new ZipArchive();
|
158
|
if ($zip->open($zip_filepath, ZipArchive::CREATE) === TRUE) {
|
159
|
// Create a bare-bones Office Open XML format directory structure. This is
|
160
|
// based on the sample simple XLSX file at
|
161
|
// http://blogs.msdn.com/b/chrisrae/archive/2011/08/18/creating-a-simple-xlsx-from-scratch-using-the-open-xml-sdk.aspx
|
162
|
$parts = $this->xlsx_parts();
|
163
|
foreach ($parts as $file_name => $file_contents) {
|
164
|
if (empty($file_contents)) {
|
165
|
$zip->addEmptyDir($file_name);
|
166
|
}
|
167
|
else {
|
168
|
$zip->addFromString($file_name, $file_contents);
|
169
|
}
|
170
|
}
|
171
|
|
172
|
// Add the actual export to the zip.
|
173
|
$zip->addEmptyDir('xl/worksheets');
|
174
|
$zip->addFile($file_filepath, 'xl/worksheets/sheet1.xml');
|
175
|
|
176
|
$zip->close();
|
177
|
|
178
|
// Switch the results file name to the new zip (xlsx) file.
|
179
|
unlink($file_uri);
|
180
|
if (!@rename($zip_uri, $file_uri)) {
|
181
|
// The file could not be renamed, probably due to different stream
|
182
|
// wrappers during drush wfx execution.
|
183
|
copy($zip_uri, $file_uri);
|
184
|
unlink($zip_uri);
|
185
|
}
|
186
|
}
|
187
|
}
|
188
|
|
189
|
/**
|
190
|
* {@inheritdoc}
|
191
|
*/
|
192
|
public function set_headers($filename) {
|
193
|
drupal_add_http_header('Content-Type', 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet');
|
194
|
drupal_add_http_header('Content-Disposition', "attachment; filename=$filename.xlsx");
|
195
|
drupal_add_http_header('Pragma', 'public');
|
196
|
drupal_add_http_header('Cache-Control', 'max-age=0');
|
197
|
}
|
198
|
|
199
|
/**
|
200
|
* Return all the parts needed to assemble a bare-bones XLSX package.
|
201
|
*/
|
202
|
public function xlsx_parts() {
|
203
|
$parts['_rels'] = '';
|
204
|
$parts['_rels/.rels'] = <<<EOL
|
205
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
206
|
<Relationships xmlns="http://schemas.openxmlformats.org/package/2006/relationships">
|
207
|
<Relationship Id="rId1" Type="http://schemas.openxmlformats.org/officeDocument/2006/relationships/officeDocument" Target="xl/workbook.xml"/>
|
208
|
</Relationships>
|
209
|
EOL;
|
210
|
|
211
|
$parts['xl'] = '';
|
212
|
$parts['xl/_rels'] = '';
|
213
|
$parts['xl/_rels/workbook.xml.rels'] = <<<EOL
|
214
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
215
|
<Relationships xmlns="http://schemas.openxmlformats.org/package/2006/relationships">
|
216
|
<Relationship Id="rId1" Type="http://schemas.openxmlformats.org/officeDocument/2006/relationships/worksheet" Target="worksheets/sheet1.xml"/>
|
217
|
<Relationship Id="rId2" Type="http://schemas.openxmlformats.org/officeDocument/2006/relationships/styles" Target="styles.xml"/>
|
218
|
</Relationships>
|
219
|
EOL;
|
220
|
$parts['xl/styles.xml'] = <<<EOL
|
221
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
222
|
<styleSheet xmlns="http://schemas.openxmlformats.org/spreadsheetml/2006/main">
|
223
|
<fonts count="1"><font><name val="Verdana"/></font></fonts>
|
224
|
<fills count="1"><fill><patternFill patternType="none"/></fill></fills>
|
225
|
<borders count="1"><border><left/><right/><top/><bottom/><diagonal/></border></borders>
|
226
|
<cellStyleXfs count="1"><xf numFmtId="0" fontId="0" fillId="0" borderId="0"/></cellStyleXfs>
|
227
|
<cellXfs count="5">
|
228
|
<xf numFmtId="0" fontId="0" fillId="0" borderId="0" xfId="0"/>
|
229
|
<xf numFmtId="14" fontId="0" fillId="0" borderId="0" xfId="0" applyNumberFormat="1"/>
|
230
|
<xf numFmtId="18" fontId="0" fillId="0" borderId="0" xfId="0" applyNumberFormat="1"/>
|
231
|
<xf numFmtId="22" fontId="0" fillId="0" borderId="0" xfId="0" applyNumberFormat="1"/>
|
232
|
<xf numFmtId="0" fontId="0" fillId="0" borderId="0" xfId="0" applyAlignment="1">
|
233
|
<alignment wrapText="1"/>
|
234
|
</xf>
|
235
|
</cellXfs>
|
236
|
<cellStyles count="1"><cellStyle name="Normal" xfId="0" builtinId="0"/></cellStyles>
|
237
|
<dxfs count="0"/>
|
238
|
<tableStyles count="0"/>
|
239
|
</styleSheet>
|
240
|
EOL;
|
241
|
$parts['xl/workbook.xml'] = <<<EOL
|
242
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
243
|
<workbook xmlns="http://schemas.openxmlformats.org/spreadsheetml/2006/main" xmlns:r="http://schemas.openxmlformats.org/officeDocument/2006/relationships">
|
244
|
<workbookPr />
|
245
|
<sheets>
|
246
|
<sheet name="Sheet1" sheetId="1" r:id="rId1"/>
|
247
|
</sheets>
|
248
|
<calcPr calcId="0"/>
|
249
|
<fileRecoveryPr repairLoad="1"/>
|
250
|
</workbook>
|
251
|
EOL;
|
252
|
|
253
|
$parts['[Content_Types].xml'] = <<<EOL
|
254
|
<?xml version="1.0" encoding="UTF-8" standalone="yes"?>
|
255
|
<Types xmlns="http://schemas.openxmlformats.org/package/2006/content-types">
|
256
|
<Default Extension="rels" ContentType="application/vnd.openxmlformats-package.relationships+xml"/>
|
257
|
<Default Extension="xml" ContentType="application/xml"/>
|
258
|
<Override PartName="/xl/workbook.xml" ContentType="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet.main+xml"/>
|
259
|
<Override PartName="/xl/worksheets/sheet1.xml" ContentType="application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml"/>
|
260
|
<Override PartName="/xl/styles.xml" ContentType="application/vnd.openxmlformats-officedocument.spreadsheetml.styles+xml"/>
|
261
|
</Types>
|
262
|
EOL;
|
263
|
|
264
|
return $parts;
|
265
|
}
|
266
|
|
267
|
}
|