Skip to content

Commit

Permalink
Export UntarFileStream as ECMAScript Module
Browse files Browse the repository at this point in the history
  • Loading branch information
guest271314 authored Apr 10, 2022
1 parent 49e639c commit 9aa53eb
Showing 1 changed file with 263 additions and 0 deletions.
263 changes: 263 additions & 0 deletions src/untar-file-stream.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,263 @@
/**
 * A parsed PAX extended header: a list of `{ name, value }` records that can
 * be applied on top of the file entry described by a following tar header.
 */
class PaxHeader {
  /**
   * @param {ArrayBuffer|Array<{name: string, value: (string|number|null)}>} fields
   *   Either the raw bytes of the extended header (parsed via `parse`), or an
   *   already-parsed array of records.
   * @throws {Error} If raw bytes are given and they are not valid PAX records.
   */
  constructor(fields) {
    // Keep the records on the instance. Returning the parsed array from the
    // constructor would replace the instance itself, leaving callers with a
    // plain array that has no applyHeader() method.
    this._fields = Array.isArray(fields) ? fields : this.parse(fields);
  }

  /**
   * Applies every record of this header to `file`, mutating it in place.
   * A record whose value is `null` removes the corresponding property.
   * See https://www.mkssoftware.com/docs/man4/pax.4.asp
   *
   * @param {Object} file File entry object to update.
   */
  applyHeader(file) {
    for (const field of this._fields) {
      let fieldName = field.name;
      const fieldValue = field.value;

      if (fieldName === 'path') {
        // This overrides the name and prefix fields in the following header block.
        fieldName = 'name';

        if (file.prefix !== undefined) {
          delete file.prefix;
        }
      } else if (fieldName === 'linkpath') {
        // This overrides the linkname field in the following header block.
        fieldName = 'linkname';
      }

      if (fieldValue === null) {
        delete file[fieldName];
      } else {
        file[fieldName] = fieldValue;
      }
    }
  }

  /**
   * Parses the raw bytes of a PAX extended header into a list of records.
   *
   * https://www.ibm.com/support/knowledgecenter/en/SSLTBW_2.3.0/com.ibm.zos.v2r3.bpxa500/paxex.htm
   * An extended header consists of one or more records, each constructed as:
   *   "%d %s=%s\n", <length>, <keyword>, <value>
   * The records are UTF-8 encoded. <length> is the decimal length of the whole
   * record in octets, including the length digits and the trailing newline.
   *
   * @param {ArrayBuffer} buffer Raw extended header data.
   * @returns {Array<{name: string, value: (string|number|null)}>} Parsed
   *   records. Empty values become `null`, all-digit values become numbers,
   *   everything else (including floats) stays a string.
   * @throws {Error} If a record does not match the expected format.
   */
  parse(buffer) {
    const decoder = new TextDecoder();
    const fields = [];
    let bytes = new Uint8Array(buffer);

    while (bytes.length > 0) {
      // Decode bytes up to the first space character; that is the total field length
      const fieldLength = parseInt(
        decoder.decode(bytes.subarray(0, bytes.indexOf(0x20))),
        10
      );

      if (!Number.isInteger(fieldLength) || fieldLength <= 0) {
        throw new Error('Invalid PAX header data format.');
      }

      const fieldText = decoder.decode(bytes.subarray(0, fieldLength));
      // The record is delimited by its length, so the value itself may contain
      // newlines; [\s\S] is used because "." would stop at them.
      const fieldMatch = fieldText.match(/^\d+ ([^=]+)=([\s\S]*)\n$/);

      if (fieldMatch === null) {
        throw new Error('Invalid PAX header data format.');
      }

      const fieldName = fieldMatch[1];
      let fieldValue = fieldMatch[2];

      if (fieldValue.length === 0) {
        fieldValue = null;
      } else if (/^\d+$/.test(fieldValue)) {
        // If it's an integer field, parse it as int
        fieldValue = parseInt(fieldValue, 10);
      }
      // Don't parse float values since precision is lost

      fields.push({
        name: fieldName,
        value: fieldValue,
      });

      bytes = bytes.subarray(fieldLength); // Cut off the parsed field data
    }

    return fields;
  }
}

/**
 * Sequential reader over an ArrayBuffer that tracks a current byte offset.
 */
class UntarStream {
  /**
   * @param {ArrayBuffer} arrayBuffer Data to read from.
   */
  constructor(arrayBuffer) {
    this._bufferView = new DataView(arrayBuffer);
    this._position = 0;
  }

  /**
   * Reads a fixed-width, NUL-terminated text field at the current offset and
   * advances the offset by the full field width.
   *
   * @param {number} charCount Width of the field in bytes.
   * @returns {string} Bytes before the first NUL (or the whole field), decoded
   *   with a default TextDecoder.
   */
  readString(charCount) {
    const bytesPerChar = 1;
    const fieldWidth = charCount * bytesPerChar;
    const start = this.position();
    const collected = [];

    let index = 0;
    while (index < charCount) {
      const code = this._bufferView.getUint8(start + index * bytesPerChar);
      if (code === 0) {
        // A NUL byte terminates the string early.
        break;
      }
      collected.push(code);
      index += 1;
    }

    // Always skip the whole field, even when the string ended early.
    this.seek(fieldWidth);

    return new TextDecoder().decode(new Uint8Array(collected));
  }

  /**
   * Copies `byteCount` bytes starting at the current offset into a new
   * ArrayBuffer and advances the offset by `byteCount`.
   *
   * @param {number} byteCount Number of bytes to copy.
   * @returns {ArrayBuffer} The copied bytes.
   */
  readBuffer(byteCount) {
    const source = this._bufferView.buffer;
    const start = this.position();
    let chunk;

    if (typeof ArrayBuffer.prototype.slice !== 'function') {
      // Manual copy for environments without ArrayBuffer.prototype.slice.
      chunk = new ArrayBuffer(byteCount);
      new Uint8Array(chunk).set(new Uint8Array(source, start, byteCount));
    } else {
      chunk = source.slice(start, start + byteCount);
    }

    this.seek(byteCount);
    return chunk;
  }

  /**
   * Moves the current offset forward by `byteCount` bytes.
   *
   * @param {number} byteCount Relative distance to move.
   */
  seek(byteCount) {
    this._position += byteCount;
  }

  /**
   * Reads a little-endian unsigned 32-bit integer at the current offset
   * without advancing the offset.
   *
   * @returns {number} The value read.
   */
  peekUint32() {
    const littleEndian = true;
    return this._bufferView.getUint32(this.position(), littleEndian);
  }

  /**
   * Gets the current offset, or sets it when an argument is given.
   *
   * @param {number} [newpos] New absolute offset.
   * @returns {number|undefined} The current offset when called without an
   *   argument; `undefined` when used as a setter.
   */
  position(newpos) {
    if (newpos !== undefined) {
      this._position = newpos;
      return undefined;
    }
    return this._position;
  }

  /**
   * @returns {number} Total number of bytes in the underlying view.
   */
  size() {
    return this._bufferView.byteLength;
  }
}

/**
 * Iterates over the entries of a tar archive held in an ArrayBuffer.
 * Use `hasNext()` to check for another entry and `next()` to read it.
 */
class UntarFileStream {
  /**
   * @param {ArrayBuffer} arrayBuffer The complete tar archive.
   */
  constructor(arrayBuffer) {
    this._stream = new UntarStream(arrayBuffer);
    // Most recent global PAX header ('g' entry); applied to every later file.
    this._globalPaxHeader = null;
  }

  /**
   * @returns {boolean} True when more than four bytes remain after the
   *   current position and the next 32-bit word is non-zero.
   */
  hasNext() {
    return (
      this._stream.position() + 4 < this._stream.size() &&
      this._stream.peekUint32() !== 0
    );
  }

  /**
   * Reads the next file entry from the archive.
   *
   * @returns {Object} The entry's header fields plus a `buffer` property
   *   (ArrayBuffer) holding its data; empty for entries that are not regular
   *   files.
   */
  next() {
    return this._readNextFile();
  }

  /**
   * Reads one 512-byte header block and its data. PAX header entries
   * ('g' and 'x') are consumed and the entry that follows them is returned
   * instead, with the PAX fields applied.
   *
   * @returns {Object} The parsed file entry.
   */
  _readNextFile() {
    const stream = this._stream;
    // Reassigned below when this entry turns out to be a PAX header.
    let file = {};
    let isHeaderFile = false;
    let paxHeader = null;
    const headerBeginPos = stream.position();
    const dataBeginPos = headerBeginPos + 512;

    // Read header. Numeric fields are stored as octal ASCII digits, so every
    // one of them is parsed with radix 8.
    file.name = stream.readString(100);
    file.mode = stream.readString(8);
    file.uid = parseInt(stream.readString(8), 8);
    file.gid = parseInt(stream.readString(8), 8);
    file.size = parseInt(stream.readString(12), 8);
    file.mtime = parseInt(stream.readString(12), 8);
    file.checksum = parseInt(stream.readString(8), 8);
    file.type = stream.readString(1);
    file.linkname = stream.readString(100);
    file.ustarFormat = stream.readString(6);

    if (file.ustarFormat.indexOf('ustar') > -1) {
      file.version = stream.readString(2);
      file.uname = stream.readString(32);
      file.gname = stream.readString(32);
      file.devmajor = parseInt(stream.readString(8), 8);
      file.devminor = parseInt(stream.readString(8), 8);
      file.namePrefix = stream.readString(155);

      if (file.namePrefix.length > 0) {
        file.name = file.namePrefix + '/' + file.name;
      }
    }

    // The data always starts right after the 512-byte header block, no matter
    // how many header bytes were actually consumed above.
    stream.position(dataBeginPos);

    // Derived from https://www.mkssoftware.com/docs/man4/pax.4.asp
    // and https://www.ibm.com/support/knowledgecenter/en/SSLTBW_2.3.0/com.ibm.zos.v2r3.bpxa500/pxarchfm.htm
    switch (file.type) {
      case '0': // Normal file is either "0" or "\0".
      case '': // In case of "\0", readString returns an empty string, that is "".
        file.buffer = stream.readBuffer(file.size);
        break;
      case '1': // Link to another file already archived
        // TODO Should we do anything with these?
        break;
      case '2': // Symbolic link
        // TODO Should we do anything with these?
        break;
      case '3': // Character special device
        break;
      case '4': // Block special device
        break;
      case '5': // Directory
        break;
      case '6': // FIFO special file
        break;
      case '7': // Reserved
        break;
      case 'g': // Global PAX header
        isHeaderFile = true;
        this._globalPaxHeader = new PaxHeader(stream.readBuffer(file.size));
        break;
      case 'x': // PAX header
        isHeaderFile = true;
        paxHeader = new PaxHeader(stream.readBuffer(file.size));
        break;
      default:
        // Unknown file type
        break;
    }

    if (file.buffer === undefined) {
      file.buffer = new ArrayBuffer(0);
    }

    let dataEndPos = dataBeginPos + file.size;
    // File data is padded to reach a 512 byte boundary; skip the padded bytes too.
    if (file.size % 512 !== 0) {
      dataEndPos += 512 - (file.size % 512);
    }

    stream.position(dataEndPos);

    if (isHeaderFile) {
      // A PAX header describes the entry that follows it; return that entry.
      file = this._readNextFile();
    }

    if (this._globalPaxHeader !== null) {
      this._globalPaxHeader.applyHeader(file);
    }

    if (paxHeader !== null) {
      paxHeader.applyHeader(file);
    }

    return file;
  }
}
export { UntarFileStream };

0 comments on commit 9aa53eb

Please sign in to comment.