forked from exceljs/exceljs
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtestSax.js
106 lines (98 loc) · 2.44 KB
/
testSax.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
var fs = require('fs');
var events = require('events');
var _ = require('underscore');
var Promise = require('bluebird');
var Sax = require('sax');
var unzip = require('unzip');
// Path of the input file, taken from the first command-line argument
// (process.argv[0] and [1] are the node binary and the script itself).
var filename = process.argv[2];
/**
 * A single worksheet row: its row number plus the cells collected for it.
 *
 * @constructor
 * @param {number} r - Row number; stored as-is on `this.number`.
 */
var Row = function(r) {
  this.number = r;
  // Maps a cell's `address` to the cell object stored through add().
  this.cells = {};
};

/**
 * Stores a cell on this row, keyed by its address. A later cell with the
 * same address replaces the earlier one.
 *
 * The method is attached to the existing prototype rather than assigning a
 * brand-new object to Row.prototype, so Row.prototype.constructor keeps
 * pointing at Row.
 *
 * @param {{address: string}} cell - Cell to store; must carry an `address`.
 */
Row.prototype.add = function(cell) {
  this.cells[cell.address] = cell;
};
// Running total of 'row' events received on `e` since the script started.
var count = 0;

// Event hub on which parsed rows ('row') and completion ('finished') are
// reported.
var e = new events.EventEmitter();

// Print the running total when a 'finished' event arrives.
e.on('finished', function() {
  console.log('Finished worksheet: ' + count);
});

// Count every row and refresh the progress counter once per 1000 rows.
e.on('row', function() {
  count += 1;
  if (count % 1000 !== 0) {
    return;
  }
  // "\u001b[0G" (same bytes as "\033[0G") is an ANSI escape that sends the
  // cursor back to the start of the line, so each update overwrites the last.
  process.stdout.write(['Count:', count, '\u001b[0G'].join(''));
});
// Streaming zip parser: it is fed the raw file bytes and emits an 'entry'
// event, carrying a readable stream, for the files it finds in the archive.
var zip = unzip.Parse();

// Hand worksheet entries (xl/worksheets/sheet<N>.xml) to the SAX parser and
// discard everything else.
zip.on('entry', function(entry) {
  if (/xl\/worksheets\/sheet\d+[.]xml/.test(entry.path)) {
    parseSheet(entry, e);
  } else {
    // The unzip documentation requires autodrain() on every entry whose
    // contents are not consumed; otherwise the unread data piles up in
    // memory.
    entry.autodrain();
  }
});
/**
 * Streams one worksheet XML entry through a SAX parser and reports what it
 * finds on `emitter`:
 *   - 'row' (Row)  each time a <row> element closes; the Row holds every
 *                  <c> cell that closed inside it, keyed by cell address.
 *   - 'finished'   when the parser emits 'end' for this entry.
 *
 * Each cell is a plain object { address, s, t } plus optional `v` and `f`
 * members of the form { text: string }, filled from the <v> and <f> child
 * elements.
 *
 * @param {Object} entry - Readable stream of the worksheet XML; it is piped
 *     into the parser.
 * @param {Object} emitter - Event emitter that receives the 'row' and
 *     'finished' events.
 */
function parseSheet(entry, emitter) {
  // First argument `true` selects sax's strict mode.
  var parser = Sax.createStream(true, {});
  var row = null;     // Row being built, or null outside a <row>
  var cell = null;    // cell being built, or null outside a <c>
  var current = null; // text accumulator of the open <v>/<f>, else null

  parser.on('opentag', function(node) {
    switch (node.name) {
      case 'row':
        row = new Row(parseInt(node.attributes.r, 10));
        break;
      case 'c':
        cell = {
          address: node.attributes.r,
          // NaN when the element carries no `s` attribute.
          s: parseInt(node.attributes.s, 10),
          t: node.attributes.t
        };
        break;
      case 'v':
      case 'f':
        // Only collect values that belong to a cell; a stray <v>/<f> would
        // otherwise dereference null.
        if (cell) {
          current = cell[node.name] = { text: '' };
        }
        break;
    }
  });

  parser.on('text', function(text) {
    if (current) {
      current.text += text;
    }
  });

  parser.on('closetag', function(name) {
    switch (name) {
      case 'row':
        emitter.emit('row', row);
        row = null;
        break;
      case 'c':
        if (row && cell) {
          row.add(cell);
        }
        cell = null;
        break;
      case 'v':
      case 'f':
        // Stop accumulating, so text nodes that follow the element (for
        // example whitespace between tags) are not appended to its value.
        current = null;
        break;
    }
  });

  parser.on('end', function() {
    // Report on the emitter that was passed in, not on a module-level one.
    emitter.emit('finished');
  });

  entry.pipe(parser);
}
// Feed the input file to the zip parser by hand (instead of
// stream.pipe(zip)): one chunk of at most 16384 bytes per event-loop turn.
var stream = fs.createReadStream(filename);

// True once the file stream has delivered all of its data, or has failed.
var eod = false;

stream.on('end', function() {
  eod = true;
  // Tell the parser that no more input is coming. 'end' is only emitted
  // after the final chunk has been read (and therefore written) below.
  zip.end();
});

stream.on('error', function(err) {
  // Without a listener a read failure (such as a missing file) would surface
  // as an uncaught exception; report it and stop feeding the parser instead.
  eod = true;
  console.error('Failed to read ' + filename + ': ' + err.message);
  process.exitCode = 1;
});

/**
 * Queues the next read/write step on the event loop. Each step pulls one
 * chunk from the file stream and writes it to the zip parser, then re-queues
 * itself until the file has been fully read.
 */
function schedule() {
  setImmediate(function() {
    if (eod) {
      return;
    }
    // read() returns null while fewer than 16384 bytes are buffered and the
    // file has not ended yet; in that case just try again on the next turn.
    var data = stream.read(16384);
    if (data && data.length && !zip.write(data)) {
      // The parser's write buffer is full: hold off until it has drained so
      // the file is not buffered in memory faster than it is parsed.
      zip.once('drain', schedule);
      return;
    }
    schedule();
  });
}

schedule();