mirror of
https://github.com/denoland/std.git
synced 2024-11-21 20:50:22 +00:00
498 lines
15 KiB
TypeScript
498 lines
15 KiB
TypeScript
// Copyright 2018-2024 the Deno authors. All rights reserved. MIT license.
|
|
/*!
|
|
* Ported and modified from: https://github.com/beatgammit/tar-js and
|
|
* licensed as:
|
|
*
|
|
* (The MIT License)
|
|
*
|
|
* Copyright (c) 2011 T. Jameson Little
|
|
* Copyright (c) 2019 Jun Kato
|
|
* Copyright (c) 2018-2024 the Deno authors
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
* of this software and associated documentation files (the "Software"), to deal
|
|
* in the Software without restriction, including without limitation the rights
|
|
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
* copies of the Software, and to permit persons to whom the Software is
|
|
* furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice shall be included in
|
|
* all copies or substantial portions of the Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
* THE SOFTWARE.
|
|
*/
|
|
|
|
import {
|
|
FileTypes,
|
|
type TarInfo,
|
|
type TarMeta,
|
|
USTAR_STRUCTURE,
|
|
} from "./_common.ts";
|
|
import type { Reader } from "@std/io/types";
|
|
import { MultiReader } from "./_multi_reader.ts";
|
|
import { Buffer } from "@std/io/buffer";
|
|
import { HEADER_LENGTH } from "./_common.ts";
|
|
|
|
export type { TarInfo, TarMeta };
|
|
|
|
/**
|
|
* Options for {@linkcode Tar.append}.
|
|
*
|
|
* @deprecated Use {@linkcode https://jsr.io/@std/tar | @std/tar} instead.
|
|
* `@std/archive` will be removed in the future.
|
|
*
|
|
* @experimental **UNSTABLE**: New API, yet to be vetted.
|
|
*/
|
|
export interface TarOptions extends TarInfo {
|
|
/**
|
|
* Filepath of the file to append to the archive
|
|
*/
|
|
filePath?: string;
|
|
|
|
/**
|
|
* A Reader of any arbitrary content to append to the archive
|
|
*/
|
|
reader?: Reader;
|
|
|
|
/**
|
|
* Size of the content to be appended. This is only required
|
|
* when passing a reader to the archive.
|
|
*/
|
|
contentSize?: number;
|
|
}
|
|
|
|
const USTAR_MAGIC_HEADER = "ustar\u000000" as const;
|
|
|
|
/**
|
|
* Simple file reader
|
|
*/
|
|
class FileReader implements Reader {
|
|
#file: Deno.FsFile | undefined;
|
|
#filePath: string;
|
|
|
|
constructor(filePath: string) {
|
|
this.#filePath = filePath;
|
|
}
|
|
|
|
async read(p: Uint8Array): Promise<number | null> {
|
|
if (!this.#file) {
|
|
this.#file = await Deno.open(this.#filePath, { read: true });
|
|
}
|
|
const res = await this.#file.read(p);
|
|
if (res === null) {
|
|
this.#file.close();
|
|
this.#file = undefined;
|
|
}
|
|
return res;
|
|
}
|
|
}
|
|
|
|
/**
|
|
* Pads a number with leading zeros to a specified number of bytes.
|
|
*
|
|
* @param num The number to pad.
|
|
* @param bytes The number of bytes to pad the number to.
|
|
* @returns The padded number as a string.
|
|
*/
|
|
function pad(num: number, bytes: number): string {
|
|
return num.toString(8).padStart(bytes, "0");
|
|
}
|
|
|
|
/**
|
|
* Formats the header data for a tar file entry.
|
|
*
|
|
* @param data The data object containing the values for the tar header fields.
|
|
* @returns The formatted header data as a Uint8Array.
|
|
*/
|
|
function formatHeader(data: TarData): Uint8Array {
|
|
const encoder = new TextEncoder();
|
|
const buffer = new Uint8Array(HEADER_LENGTH);
|
|
let offset = 0;
|
|
for (const { field, length } of USTAR_STRUCTURE) {
|
|
const entry = encoder.encode(data[field as keyof TarData] ?? "");
|
|
buffer.set(entry, offset);
|
|
offset += length;
|
|
}
|
|
return buffer;
|
|
}
|
|
|
|
/**
|
|
* Base interface for {@linkcode TarDataWithSource}.
|
|
*
|
|
* @deprecated Use {@linkcode https://jsr.io/@std/tar | @std/tar} instead.
|
|
* `@std/archive` will be removed in the future.
|
|
*
|
|
* @experimental **UNSTABLE**: New API, yet to be vetted.
|
|
*/
|
|
export interface TarData {
|
|
/** Name of the file, excluding directory names (if any). */
|
|
fileName?: string;
|
|
/** Directory names preceding the file name (if any). */
|
|
fileNamePrefix?: string;
|
|
/**
|
|
* The underlying raw `st_mode` bits that contain the standard Unix
|
|
* permissions for this file/directory.
|
|
*/
|
|
fileMode?: string;
|
|
/**
|
|
* Numeric user ID of the file owner. This is ignored if the operating system
|
|
* does not support numeric user IDs.
|
|
*/
|
|
uid?: string;
|
|
/**
|
|
* Numeric group ID of the file owner. This is ignored if the operating
|
|
* system does not support numeric group IDs.
|
|
*/
|
|
gid?: string;
|
|
/**
|
|
* The size of the file in bytes; for archive members that are symbolic or
|
|
* hard links to another file, this field is specified as zero.
|
|
*/
|
|
fileSize?: string;
|
|
/**
|
|
* Data modification time of the file at the time it was archived. It
|
|
* represents the integer number of seconds since January 1, 1970, 00:00 UTC.
|
|
*/
|
|
mtime?: string;
|
|
/** The simple sum of all bytes in the header block */
|
|
checksum?: string;
|
|
/**
|
|
* The type of file archived.
|
|
*
|
|
* @see {@linkcode FileTypes}
|
|
*/
|
|
type?: string;
|
|
/** Ustar magic header */
|
|
ustar?: string;
|
|
/** The name of the file owner. */
|
|
owner?: string;
|
|
/** The group that the file owner belongs to. */
|
|
group?: string;
|
|
}
|
|
|
|
/**
|
|
* Tar data interface for {@linkcode Tar.data}.
|
|
*
|
|
* @deprecated Use {@linkcode https://jsr.io/@std/tar | @std/tar} instead.
|
|
* `@std/archive` will be removed in the future.
|
|
*
|
|
* @experimental **UNSTABLE**: New API, yet to be vetted.
|
|
*/
|
|
export interface TarDataWithSource extends TarData {
|
|
/**
|
|
* Path of the file to read.
|
|
*/
|
|
filePath?: string;
|
|
/**
|
|
* Buffer reader.
|
|
*/
|
|
reader?: Reader;
|
|
}
|
|
|
|
/**
|
|
* ### Overview
|
|
* A class to create a tar archive. Tar archives allow for storing multiple files in a
|
|
* single file (called an archive, or sometimes a tarball). These archives typically
|
|
* have the '.tar' extension.
|
|
*
|
|
* @deprecated Use {@linkcode https://jsr.io/@std/tar | @std/tar} instead.
|
|
* `@std/archive` will be removed in the future.
|
|
*
|
|
* ### Usage
|
|
* The workflow is to create a Tar instance, append files to it, and then write the
|
|
* tar archive to the filesystem (or other output stream). See the worked example
|
|
* below for details.
|
|
*
|
|
* ### Compression
|
|
* Tar archives are not compressed by default. If you want to compress the archive,
|
|
* you may compress the tar archive after creation, but this capability is not provided
|
|
* here.
|
|
*
|
|
* ### File format and limitations
|
|
*
|
|
* The ustar file format is used for creating the archive file.
|
|
* While this format is compatible with most tar readers,
|
|
* the format has several limitations, including:
|
|
* * Files must be smaller than 8GiB
|
|
* * Filenames (including path) must be shorter than 256 characters
|
|
* * Filenames (including path) cannot contain non-ASCII characters
|
|
* * Sparse files are not supported
|
|
*
|
|
* @example Usage
|
|
* ```ts ignore
|
|
* import { Tar } from "@std/archive/tar";
|
|
* import { Buffer } from "@std/io/buffer";
|
|
* import { copy } from "@std/io/copy";
|
|
*
|
|
* const tar = new Tar();
|
|
*
|
|
* // Now that we've created our tar, let's add some files to it:
|
|
*
|
|
* const content = new TextEncoder().encode("Some arbitrary content");
|
|
* await tar.append("deno.txt", {
|
|
* reader: new Buffer(content),
|
|
* contentSize: content.byteLength,
|
|
* });
|
|
*
|
|
* // This file is sourced from the filesystem (and renamed in the archive)
|
|
* await tar.append("filename_in_archive.txt", {
|
|
* filePath: "./filename_on_filesystem.txt",
|
|
* });
|
|
*
|
|
* // Now let's write the tar (with its two files) to the filesystem
|
|
* // use tar.getReader() to read the contents.
|
|
*
|
|
* const writer = await Deno.open("./out.tar", { write: true, create: true });
|
|
* await copy(tar.getReader(), writer);
|
|
* writer.close();
|
|
* ```
|
|
*
|
|
* @experimental **UNSTABLE**: New API, yet to be vetted.
|
|
*/
|
|
export class Tar {
|
|
/** Tar data. */
|
|
#data: TarDataWithSource[];
|
|
|
|
/** Constructs a new instance. */
|
|
constructor() {
|
|
this.#data = [];
|
|
}
|
|
|
|
/**
|
|
* Append a file or reader of arbitrary content to this tar archive. Directories
|
|
* appended to the archive append only the directory itself to the archive, not
|
|
* its contents. To add a directory and its contents, recursively append the
|
|
* directory's contents. Directories and subdirectories will be created automatically
|
|
* in the archive as required.
|
|
*
|
|
* @param filenameInArchive File name of the content in the archive. E.g.
|
|
* `test.txt`. Use slash for directory separators.
|
|
* @param source Details of the source of the content including the
|
|
* reference to the content itself and potentially any related metadata.
|
|
*
|
|
* @example Usage
|
|
* ```ts ignore
|
|
* import { Tar } from "@std/archive/tar";
|
|
* import { Buffer } from "@std/io/buffer";
|
|
* import { copy } from "@std/io/copy";
|
|
*
|
|
* const tar = new Tar();
|
|
*
|
|
* // Now that we've created our tar, let's add some files to it:
|
|
*
|
|
* const content = new TextEncoder().encode("Some arbitrary content");
|
|
* await tar.append("deno.txt", {
|
|
* reader: new Buffer(content),
|
|
* contentSize: content.byteLength,
|
|
* });
|
|
*
|
|
* // This file is sourced from the filesystem (and renamed in the archive)
|
|
* await tar.append("filename_in_archive.txt", {
|
|
* filePath: "./filename_on_filesystem.txt",
|
|
* });
|
|
*
|
|
* // Now let's write the tar (with its two files) to the filesystem
|
|
* // use tar.getReader() to read the contents.
|
|
*
|
|
* const writer = await Deno.open("./out.tar", { write: true, create: true });
|
|
* await copy(tar.getReader(), writer);
|
|
* writer.close();
|
|
* ```
|
|
*/
|
|
async append(filenameInArchive: string, source: TarOptions) {
|
|
if (typeof filenameInArchive !== "string") {
|
|
throw new Error("Cannot append data: File name is not a string");
|
|
}
|
|
let fileName = filenameInArchive;
|
|
|
|
/**
|
|
* Ustar format has a limitation of file name length. Specifically:
|
|
* 1. File names can contain at most 255 bytes.
|
|
* 2. File names longer than 100 bytes must be split at a directory separator in two parts,
|
|
* the first being at most 155 bytes long. So, in most cases file names must be a bit shorter
|
|
* than 255 bytes.
|
|
*/
|
|
// separate file name into two parts if needed
|
|
let fileNamePrefix: string | undefined;
|
|
if (fileName.length > 100) {
|
|
let i = fileName.length;
|
|
while (i >= 0) {
|
|
i = fileName.lastIndexOf("/", i);
|
|
if (i <= 155) {
|
|
fileNamePrefix = fileName.slice(0, i);
|
|
fileName = fileName.slice(i + 1);
|
|
break;
|
|
}
|
|
i--;
|
|
}
|
|
const errMsg =
|
|
"Cannot append data: The 'ustar' format does not allow a long file name (length of [file name" +
|
|
"prefix] + / + [file name] must be shorter than 256 bytes)";
|
|
if (i < 0 || fileName.length > 100) {
|
|
throw new Error(errMsg);
|
|
} else {
|
|
if (fileNamePrefix === undefined) {
|
|
throw new TypeError("File name prefix is undefined");
|
|
}
|
|
if (fileNamePrefix.length > 155) {
|
|
throw new Error(errMsg);
|
|
}
|
|
}
|
|
}
|
|
|
|
source = source ?? {};
|
|
|
|
// set meta data
|
|
let info: Deno.FileInfo | undefined;
|
|
if (source.filePath) {
|
|
info = await Deno.stat(source.filePath);
|
|
if (info.isDirectory) {
|
|
info.size = 0;
|
|
source.reader = new Buffer();
|
|
}
|
|
}
|
|
|
|
const mode = source.fileMode || (info && info.mode) ||
|
|
parseInt("777", 8) & 0xfff /* 511 */;
|
|
const mtime = Math.floor(
|
|
source.mtime ?? (info?.mtime ?? new Date()).valueOf() / 1000,
|
|
);
|
|
const uid = source.uid ?? 0;
|
|
const gid = source.gid ?? 0;
|
|
|
|
if (typeof source.owner === "string" && source.owner.length >= 32) {
|
|
throw new Error(
|
|
"Cannot append data: The 'ustar' format does not allow owner name length >= 32 bytes",
|
|
);
|
|
}
|
|
if (typeof source.group === "string" && source.group.length >= 32) {
|
|
throw new Error(
|
|
"Cannot append data: The 'ustar' format does not allow group name length >= 32 bytes",
|
|
);
|
|
}
|
|
|
|
const fileSize = info?.size ?? source.contentSize;
|
|
if (fileSize === undefined) {
|
|
throw new TypeError("Cannot append data: The file size is not defined");
|
|
}
|
|
|
|
const type = source.type
|
|
? FileTypes[source.type as keyof typeof FileTypes]
|
|
: (info?.isDirectory ? FileTypes.directory : FileTypes.file);
|
|
const tarData: TarDataWithSource = {
|
|
fileName,
|
|
fileMode: pad(mode, 7),
|
|
uid: pad(uid, 7),
|
|
gid: pad(gid, 7),
|
|
fileSize: pad(fileSize, 11),
|
|
mtime: pad(mtime, 11),
|
|
checksum: " ",
|
|
type: type.toString(),
|
|
ustar: USTAR_MAGIC_HEADER,
|
|
owner: source.owner ?? "",
|
|
group: source.group ?? "",
|
|
};
|
|
if (fileNamePrefix !== undefined) {
|
|
tarData.fileNamePrefix = fileNamePrefix;
|
|
}
|
|
if (source.filePath !== undefined) {
|
|
tarData.filePath = source.filePath;
|
|
}
|
|
if (source.reader !== undefined) {
|
|
tarData.reader = source.reader;
|
|
}
|
|
|
|
// calculate the checksum
|
|
let checksum = 0;
|
|
const encoder = new TextEncoder();
|
|
Object.keys(tarData)
|
|
.filter((key): boolean => ["filePath", "reader"].indexOf(key) < 0)
|
|
.forEach(function (key) {
|
|
checksum += encoder
|
|
.encode(tarData[key as keyof TarData])
|
|
.reduce((p, c): number => p + c, 0);
|
|
});
|
|
|
|
tarData.checksum = pad(checksum, 6) + "\u0000 ";
|
|
this.#data.push(tarData);
|
|
}
|
|
|
|
/**
|
|
* Get a {@linkcode Reader} instance for this tar archive.
|
|
*
|
|
* @returns A reader instance for the tar archive.
|
|
*
|
|
* @example Usage
|
|
* ```ts ignore
|
|
* import { Tar } from "@std/archive/tar";
|
|
* import { Buffer } from "@std/io/buffer";
|
|
* import { copy } from "@std/io/copy";
|
|
*
|
|
* const tar = new Tar();
|
|
*
|
|
* // Now that we've created our tar, let's add some files to it:
|
|
*
|
|
* const content = new TextEncoder().encode("Some arbitrary content");
|
|
* await tar.append("deno.txt", {
|
|
* reader: new Buffer(content),
|
|
* contentSize: content.byteLength,
|
|
* });
|
|
*
|
|
* // This file is sourced from the filesystem (and renamed in the archive)
|
|
* await tar.append("filename_in_archive.txt", {
|
|
* filePath: "./filename_on_filesystem.txt",
|
|
* });
|
|
*
|
|
* // Now let's write the tar (with its two files) to the filesystem
|
|
* // use tar.getReader() to read the contents.
|
|
*
|
|
* const writer = await Deno.open("./out.tar", { write: true, create: true });
|
|
* await copy(tar.getReader(), writer);
|
|
* writer.close();
|
|
* ```
|
|
*/
|
|
getReader(): Reader {
|
|
const readers: Reader[] = [];
|
|
this.#data.forEach((tarData) => {
|
|
let { reader } = tarData;
|
|
const { filePath } = tarData;
|
|
const headerArr = formatHeader(tarData);
|
|
readers.push(new Buffer(headerArr));
|
|
if (!reader) {
|
|
if (filePath === undefined) {
|
|
throw new TypeError(
|
|
"Cannot get the reader for the tar archive: FilePath is not defined",
|
|
);
|
|
}
|
|
reader = new FileReader(filePath);
|
|
}
|
|
readers.push(reader);
|
|
|
|
// to the nearest multiple of recordSize
|
|
if (tarData.fileSize === undefined) {
|
|
throw new TypeError(
|
|
"Cannot get the reader for the tar archive: FileSize is not defined",
|
|
);
|
|
}
|
|
readers.push(
|
|
new Buffer(
|
|
new Uint8Array(
|
|
HEADER_LENGTH -
|
|
(parseInt(tarData.fileSize, 8) % HEADER_LENGTH || HEADER_LENGTH),
|
|
),
|
|
),
|
|
);
|
|
});
|
|
|
|
// append 2 empty records
|
|
readers.push(new Buffer(new Uint8Array(HEADER_LENGTH * 2)));
|
|
return new MultiReader(readers);
|
|
}
|
|
}
|