_stream_transform.js 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190
  1. // Copyright Joyent, Inc. and other Node contributors.
  2. //
  3. // Permission is hereby granted, free of charge, to any person obtaining a
  4. // copy of this software and associated documentation files (the
  5. // "Software"), to deal in the Software without restriction, including
  6. // without limitation the rights to use, copy, modify, merge, publish,
  7. // distribute, sublicense, and/or sell copies of the Software, and to permit
  8. // persons to whom the Software is furnished to do so, subject to the
  9. // following conditions:
  10. //
  11. // The above copyright notice and this permission notice shall be included
  12. // in all copies or substantial portions of the Software.
  13. //
  14. // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
  15. // OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
  16. // MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN
  17. // NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM,
  18. // DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR
  19. // OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE
  20. // USE OR OTHER DEALINGS IN THE SOFTWARE.
  21. // a transform stream is a readable/writable stream where you do
  22. // something with the data. Sometimes it's called a "filter",
  23. // but that's not a great name for it, since that implies a thing where
  24. // some bits pass through, and others are simply ignored. (That would
  25. // be a valid example of a transform, of course.)
  26. //
  27. // While the output is causally related to the input, it's not a
  28. // necessarily symmetric or synchronous transformation. For example,
  29. // a zlib stream might take multiple plain-text writes(), and then
  30. // emit a single compressed chunk some time in the future.
  31. //
  32. // Here's how this works:
  33. //
  34. // The Transform stream has all the aspects of the readable and writable
  35. // stream classes. When you write(chunk), that calls _write(chunk,cb)
  36. // internally, and returns false if there's a lot of pending writes
  37. // buffered up. When you call read(), that calls _read(n) until
  38. // there's enough pending readable data buffered up.
  39. //
  40. // In a transform stream, the written data is placed in a buffer. When
  41. // _read(n) is called, it transforms the queued up data, calling the
  42. // buffered _write cb's as it consumes chunks. If consuming a single
  43. // written chunk would result in multiple output chunks, then the first
  44. // outputted bit calls the readcb, and subsequent chunks just go into
  45. // the read buffer, and will cause it to emit 'readable' if necessary.
  46. //
  47. // This way, back-pressure is actually determined by the reading side,
  48. // since _read has to be called to start processing a new chunk. However,
  49. // a pathological inflate type of transform can cause excessive buffering
  50. // here. For example, imagine a stream where every byte of input is
  51. // interpreted as an integer from 0-255, and then results in that many
  52. // bytes of output. Writing the 4 bytes {ff,ff,ff,ff} would result in
  53. // 1kb of data being output. In this case, you could write a very small
  54. // amount of input, and end up with a very large amount of output. In
  55. // such a pathological inflating mechanism, there'd be no way to tell
  56. // the system to stop doing the transform. A single 4MB write could
  57. // cause the system to run out of memory.
  58. //
  59. // However, even in such a pathological case, only a single written chunk
  60. // would be consumed, and then the rest would wait (un-transformed) until
  61. // the results of the previous transformed chunk were consumed.
  62. 'use strict';
  63. module.exports = Transform;
  64. var _require$codes = require('../errors').codes,
  65. ERR_METHOD_NOT_IMPLEMENTED = _require$codes.ERR_METHOD_NOT_IMPLEMENTED,
  66. ERR_MULTIPLE_CALLBACK = _require$codes.ERR_MULTIPLE_CALLBACK,
  67. ERR_TRANSFORM_ALREADY_TRANSFORMING = _require$codes.ERR_TRANSFORM_ALREADY_TRANSFORMING,
  68. ERR_TRANSFORM_WITH_LENGTH_0 = _require$codes.ERR_TRANSFORM_WITH_LENGTH_0;
  69. var Duplex = require('./_stream_duplex');
  70. require('inherits')(Transform, Duplex);
  71. function afterTransform(er, data) {
  72. var ts = this._transformState;
  73. ts.transforming = false;
  74. var cb = ts.writecb;
  75. if (cb === null) {
  76. return this.emit('error', new ERR_MULTIPLE_CALLBACK());
  77. }
  78. ts.writechunk = null;
  79. ts.writecb = null;
  80. if (data != null)
  81. // single equals check for both `null` and `undefined`
  82. this.push(data);
  83. cb(er);
  84. var rs = this._readableState;
  85. rs.reading = false;
  86. if (rs.needReadable || rs.length < rs.highWaterMark) {
  87. this._read(rs.highWaterMark);
  88. }
  89. }
  90. function Transform(options) {
  91. if (!(this instanceof Transform)) return new Transform(options);
  92. Duplex.call(this, options);
  93. this._transformState = {
  94. afterTransform: afterTransform.bind(this),
  95. needTransform: false,
  96. transforming: false,
  97. writecb: null,
  98. writechunk: null,
  99. writeencoding: null
  100. };
  101. // start out asking for a readable event once data is transformed.
  102. this._readableState.needReadable = true;
  103. // we have implemented the _read method, and done the other things
  104. // that Readable wants before the first _read call, so unset the
  105. // sync guard flag.
  106. this._readableState.sync = false;
  107. if (options) {
  108. if (typeof options.transform === 'function') this._transform = options.transform;
  109. if (typeof options.flush === 'function') this._flush = options.flush;
  110. }
  111. // When the writable side finishes, then flush out anything remaining.
  112. this.on('prefinish', prefinish);
  113. }
  114. function prefinish() {
  115. var _this = this;
  116. if (typeof this._flush === 'function' && !this._readableState.destroyed) {
  117. this._flush(function (er, data) {
  118. done(_this, er, data);
  119. });
  120. } else {
  121. done(this, null, null);
  122. }
  123. }
  124. Transform.prototype.push = function (chunk, encoding) {
  125. this._transformState.needTransform = false;
  126. return Duplex.prototype.push.call(this, chunk, encoding);
  127. };
  128. // This is the part where you do stuff!
  129. // override this function in implementation classes.
  130. // 'chunk' is an input chunk.
  131. //
  132. // Call `push(newChunk)` to pass along transformed output
  133. // to the readable side. You may call 'push' zero or more times.
  134. //
  135. // Call `cb(err)` when you are done with this chunk. If you pass
  136. // an error, then that'll put the hurt on the whole operation. If you
  137. // never call cb(), then you'll never get another chunk.
  138. Transform.prototype._transform = function (chunk, encoding, cb) {
  139. cb(new ERR_METHOD_NOT_IMPLEMENTED('_transform()'));
  140. };
  141. Transform.prototype._write = function (chunk, encoding, cb) {
  142. var ts = this._transformState;
  143. ts.writecb = cb;
  144. ts.writechunk = chunk;
  145. ts.writeencoding = encoding;
  146. if (!ts.transforming) {
  147. var rs = this._readableState;
  148. if (ts.needTransform || rs.needReadable || rs.length < rs.highWaterMark) this._read(rs.highWaterMark);
  149. }
  150. };
  151. // Doesn't matter what the args are here.
  152. // _transform does all the work.
  153. // That we got here means that the readable side wants more data.
  154. Transform.prototype._read = function (n) {
  155. var ts = this._transformState;
  156. if (ts.writechunk !== null && !ts.transforming) {
  157. ts.transforming = true;
  158. this._transform(ts.writechunk, ts.writeencoding, ts.afterTransform);
  159. } else {
  160. // mark that we need a transform, so that any data that comes in
  161. // will get processed, now that we've asked for it.
  162. ts.needTransform = true;
  163. }
  164. };
  165. Transform.prototype._destroy = function (err, cb) {
  166. Duplex.prototype._destroy.call(this, err, function (err2) {
  167. cb(err2);
  168. });
  169. };
  170. function done(stream, er, data) {
  171. if (er) return stream.emit('error', er);
  172. if (data != null)
  173. // single equals check for both `null` and `undefined`
  174. stream.push(data);
  175. // TODO(BridgeAR): Write a test for these two error cases
  176. // if there's nothing in the write buffer, then that means
  177. // that nothing more will ever be provided
  178. if (stream._writableState.length) throw new ERR_TRANSFORM_WITH_LENGTH_0();
  179. if (stream._transformState.transforming) throw new ERR_TRANSFORM_ALREADY_TRANSFORMING();
  180. return stream.push(null);
  181. }