123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527 |
- /**
- * Copyright (c) 2022 mol* contributors, licensed under MIT, See LICENSE file for more info.
- *
- * Adapted from https://github.com/cheminfo-js/netcdfjs
- * MIT License, Copyright (c) 2016 cheminfo
- *
- * @author Alexander Rose <alexander.rose@weirdbyte.de>
- */
- import { IOBuffer } from '../io-buffer';
/**
 * Describes the record dimension of a NetCDF file, i.e. the dimension whose
 * declared size in the header is 0.
 */
export interface NetCDFRecordDimension {
    /** Number of records, taken from the first word of the header. */
    length: number;
    /** Index of the record dimension in the dimension list, if there is one. */
    id?: number;
    /** Name of the record dimension, if there is one. */
    name?: string;
    /** Sum of the sizes of all record variables; used as the stride between records. */
    recordStep?: number;
}
/**
 * Header entry describing one variable stored in the file.
 */
export interface NetCDFVariable {
    /** Variable name as read from the header. */
    name: string;
    /** Indices into the header's list of dimensions. */
    dimensions: any[];
    /** Attributes attached to this variable. */
    attributes: any[];
    /** Type name, e.g. 'byte', 'char', 'short', 'int', 'float' or 'double'. */
    type: string;
    /** Size field of the variable as stored in the header (bytes). */
    size: number;
    /** Position in the buffer where the variable's data starts. */
    offset: number;
    /** True when the first dimension of the variable is the record dimension. */
    record: boolean;
}
/**
 * Parsed content of a NetCDF header.
 */
export interface NetCDFHeader {
    /** Information about the record dimension (record count, id, name, stride). */
    recordDimension: NetCDFRecordDimension;
    /** Version byte that follows the 'CDF' magic (1 is the classic format). */
    version: number;
    /** All dimensions in the order they are listed in the header. */
    dimensions: { name: string; size: number }[];
    /** Attributes that belong to the file as a whole. */
    globalAttributes: { name: string; type: string; value: string | number }[];
    /** Header entries of all variables. */
    variables: NetCDFVariable[];
}
/**
 * A named dimension from the header's dimension list.
 */
export interface NetCDFDimension {
    /** Dimension name. */
    name: string;
    /** Declared length; the parser treats a size of 0 as the record dimension. */
    size: number;
}
/**
 * Raises a "not a valid NetCDF" error when the given condition holds.
 *
 * @param statement Condition that marks the input as invalid.
 * @param reason Explanation appended to the error message.
 * @throws TypeError when `statement` is true.
 */
function notNetcdf(statement: boolean, reason: string) {
    if (!statement) return;
    throw new TypeError('Not a valid NetCDF v3.x file: ' + reason);
}
/**
 * Advances the buffer to the next multiple of 4 bytes.
 * Does nothing when the current offset is already aligned.
 */
function padding(buffer: IOBuffer) {
    const misalignment = buffer.offset % 4;
    if (misalignment !== 0) {
        buffer.skip(4 - misalignment);
    }
}
/**
 * Reads a length-prefixed name: a 32-bit length, that many characters, and
 * then padding up to the next 4-byte boundary.
 *
 * @returns The characters of the name.
 */
function readName(buffer: IOBuffer) {
    // The length word comes first and determines how many characters follow
    const name = buffer.readChars(buffer.readUint32());
    // TODO validate name
    padding(buffer);
    return name;
}
/**
 * Numeric type identifiers as stored in the header, keyed by type name.
 */
const types = {
    /** 1 byte per value */
    BYTE: 1,
    /** 1 byte per value */
    CHAR: 2,
    /** 2 bytes per value */
    SHORT: 3,
    /** 4 bytes per value */
    INT: 4,
    /** 4 bytes per value */
    FLOAT: 5,
    /** 8 bytes per value */
    DOUBLE: 6
};
/**
 * Maps a numeric type identifier to its type name.
 *
 * @param type Type identifier; it is coerced with `Number()` before matching.
 * @returns The type name, or the string 'undefined' for unknown identifiers.
 */
function num2str(type: number) {
    const code = Number(type);
    if (code === types.BYTE) return 'byte';
    if (code === types.CHAR) return 'char';
    if (code === types.SHORT) return 'short';
    if (code === types.INT) return 'int';
    if (code === types.FLOAT) return 'float';
    if (code === types.DOUBLE) return 'double';
    return 'undefined';
}
/**
 * Gives the size in bytes of one value of the given type.
 *
 * @param type Type identifier; it is coerced with `Number()` before matching.
 * @returns 1, 2, 4 or 8 for known types and -1 for unknown identifiers.
 */
function num2bytes(type: number) {
    switch (Number(type)) {
        case types.BYTE:
        case types.CHAR:
            return 1;
        case types.SHORT:
            return 2;
        case types.INT:
        case types.FLOAT:
            return 4;
        case types.DOUBLE:
            return 8;
    }
    return -1;
}
/**
 * Inverse of `num2str`: maps a type name to its numeric identifier.
 *
 * @param type Type name; it is coerced with `String()` before the lookup.
 * @returns The numeric identifier, or -1 when the name is not a known type.
 */
function str2num(type: string) {
    const codes = new Map<string, number>([
        ['byte', types.BYTE],
        ['char', types.CHAR],
        ['short', types.SHORT],
        ['int', types.INT],
        ['float', types.FLOAT],
        ['double', types.DOUBLE]
    ]);
    const code = codes.get(String(type));
    return code === undefined ? -1 : code;
}
/**
 * Reads `size` consecutive numbers with the supplied reader.
 *
 * @param size Number of values to read.
 * @param bufferReader Callback that reads and returns the next value.
 * @returns The bare value when `size` is exactly 1, otherwise an array with
 * `size` entries (empty when `size` is 0).
 */
function readNumber(size: number, bufferReader: () => number): number | number[] {
    // A single value is handed back unwrapped rather than as a 1-element array
    if (size === 1) return bufferReader();
    const numbers = new Array<number>(size);
    for (let i = 0; i < size; i++) {
        numbers[i] = bufferReader();
    }
    return numbers;
}
/**
 * Reads `size` elements of the given type from the buffer.
 *
 * Bytes are read with `readBytes`, chars as a string with one trailing null
 * removed, and numeric types through `readNumber`.
 *
 * @param type Numeric type identifier (see `types`).
 * @param size Number of elements to read.
 * @throws TypeError when `type` is not a known identifier.
 */
function readType(buffer: IOBuffer, type: number, size: number) {
    if (type === types.BYTE) return buffer.readBytes(size);
    if (type === types.CHAR) return trimNull(buffer.readChars(size));
    if (type === types.SHORT) return readNumber(size, buffer.readInt16.bind(buffer));
    if (type === types.INT) return readNumber(size, buffer.readInt32.bind(buffer));
    if (type === types.FLOAT) return readNumber(size, buffer.readFloat32.bind(buffer));
    if (type === types.DOUBLE) return readNumber(size, buffer.readFloat64.bind(buffer));
    // Unknown identifier: notNetcdf throws, the return only satisfies the compiler
    notNetcdf(true, 'non valid type ' + type);
    return undefined;
}
/**
 * Strips a single trailing null character, if the string ends with one.
 *
 * @returns The input without its last character when that character has
 * char code 0, otherwise the input unchanged.
 */
function trimNull(value: string) {
    const last = value.length - 1;
    return value.charCodeAt(last) === 0 ? value.substring(0, last) : value;
}
- // const STREAMING = 4294967295;
/**
 * Reads all values of a non-record variable, starting at the buffer's
 * current position.
 *
 * @param variable Header entry; `size` divided by the byte width of `type`
 * gives the number of elements.
 * @returns Array holding one entry per element.
 */
function nonRecord(buffer: IOBuffer, variable: { type: string, size: number }) {
    const type = str2num(variable.type);
    // number of elements = total size / size of one element
    const count = variable.size / num2bytes(type);
    const data = new Array(count);
    let index = 0;
    while (index < count) {
        data[index] = readType(buffer, type, 1);
        index++;
    }
    return data;
}
/**
 * Reads the values of a record variable, one entry per record.
 *
 * For every record the variable's slab is read at the current position and
 * the buffer is then moved `recordStep` bytes past the start of that slab.
 *
 * @param variable Header entry of the variable.
 * @param recordDimension Supplies the number of records and the record stride.
 * @returns Array with `recordDimension.length` entries.
 */
function record(buffer: IOBuffer, variable: { type: string, size: number }, recordDimension: NetCDFRecordDimension) {
    const type = str2num(variable.type);
    // elements per record; a size of 0 is treated as a single element
    let width = 1;
    if (variable.size) {
        width = variable.size / num2bytes(type);
    }
    // TODO streaming data
    const recordCount = recordDimension.length;
    const stride = recordDimension.recordStep;
    const data = new Array(recordCount);
    for (let r = 0; r < recordCount; r++) {
        const start = buffer.offset;
        data[r] = readType(buffer, type, width);
        // jump over the other record variables to the next record of this one
        buffer.seek(start + stride!);
    }
    return data;
}
// Tags of the header grammar (32-bit words)
/** Tag of an absent list. */
const ZERO = 0x00;
/** Tag that introduces the list of dimensions. */
const NC_DIMENSION = 0x0A;
/** Tag that introduces the list of variables. */
const NC_VARIABLE = 0x0B;
/** Tag that introduces a list of attributes. */
const NC_ATTRIBUTE = 0x0C;
/**
 * Reads the header of the file.
 *
 * The returned object has the fields:
 * - `recordDimension`: object with the number of records plus id, name and
 *   record step of the record dimension
 * - `version`: the version passed in
 * - `dimensions`: list of dimensions
 * - `globalAttributes`: list of global attributes
 * - `variables`: list of variables
 *
 * @param buffer Buffer positioned right after the magic and version bytes.
 * @param version Version byte of the file.
 */
function header(buffer: IOBuffer, version: number) {
    // The header starts with the number of records
    const recordDimension: NetCDFRecordDimension = { length: buffer.readUint32() };
    const parsed: Partial<NetCDFHeader> = { recordDimension, version };

    // Dimensions also tell which one is the record dimension
    const dims = dimensionsList(buffer) as { dimensions: NetCDFDimension[], recordId: number, recordName: string };
    recordDimension.id = dims.recordId;
    recordDimension.name = dims.recordName;
    parsed.dimensions = dims.dimensions;

    // Global attributes
    parsed.globalAttributes = attributesList(buffer);

    // Variables, together with the summed size of all record variables
    const vars = variablesList(buffer, dims.recordId, version) as { variables: any[], recordStep: number };
    parsed.variables = vars.variables;
    recordDimension.recordStep = vars.recordStep;

    return parsed;
}
/**
 * Reads the list of dimensions from the header.
 *
 * @returns An object with
 * - `dimensions`: the dimensions in file order (empty when the list is absent)
 * - `recordId`: index of the dimension whose size is 0, or `undefined`
 * - `recordName`: name of that dimension, or `undefined`
 * @throws TypeError when the list tag is neither the dimension tag nor a
 * well-formed absent-list marker.
 */
function dimensionsList(buffer: IOBuffer) {
    let recordId: number | undefined;
    let recordName: string | undefined;
    const dimList = buffer.readUint32();
    if (dimList === ZERO) {
        // An absent list is encoded as two zero words
        notNetcdf((buffer.readUint32() !== ZERO), 'wrong empty tag for list of dimensions');
        // Return the same shape as for a populated list so that callers can
        // read `dimensions`, `recordId` and `recordName` unconditionally
        const dimensions: NetCDFDimension[] = [];
        return { dimensions, recordId, recordName };
    }
    notNetcdf((dimList !== NC_DIMENSION), 'wrong tag for list of dimensions');
    // Number of dimensions
    const dimensionSize = buffer.readUint32();
    const dimensions: NetCDFDimension[] = new Array(dimensionSize);
    for (let dim = 0; dim < dimensionSize; dim++) {
        const name = readName(buffer);
        const size = buffer.readUint32();
        // A size of 0 marks the record dimension
        if (size === 0) {
            recordId = dim;
            recordName = name;
        }
        dimensions[dim] = { name, size };
    }
    return { dimensions, recordId, recordName };
}
/**
 * Reads a list of attributes (global or per variable) from the header.
 *
 * @returns One `{ name, type, value }` entry per attribute, or an empty
 * array when the list is absent.
 * @throws TypeError on a wrong list tag or an attribute type outside 1..6.
 */
function attributesList(buffer: IOBuffer) {
    const tag = buffer.readUint32();
    if (tag === ZERO) {
        // An absent list is encoded as two zero words
        notNetcdf((buffer.readUint32() !== ZERO), 'wrong empty tag for list of attributes');
        return [];
    }
    notNetcdf((tag !== NC_ATTRIBUTE), 'wrong tag for list of attributes');

    // Number of attributes
    const count = buffer.readUint32();
    const attributes: { name: string, type: ReturnType<typeof num2str>, value: any }[] = new Array(count);
    for (let index = 0; index < count; index++) {
        const name = readName(buffer);
        const type = buffer.readUint32();
        notNetcdf(((type < 1) || (type > 6)), 'non valid type ' + type);
        // Element count followed by the values themselves
        const length = buffer.readUint32();
        const value = readType(buffer, type, length);
        // Values are padded to a 4-byte boundary
        padding(buffer);
        attributes[index] = { name: name, type: num2str(type), value: value };
    }
    return attributes;
}
/**
 * Reads the list of variables from the header.
 *
 * @param buffer Buffer positioned at the tag of the variable list.
 * @param recordId Index of the record dimension, or `undefined` when the
 * file has none.
 * @param version Version byte; for version 2 every offset is stored as two
 * 32-bit words.
 * @returns An object with
 * - `variables`: header entries of all variables (empty when the list is absent)
 * - `recordStep`: sum of the sizes of all record variables
 * @throws TypeError on a wrong list tag, a variable type outside 1..6, or a
 * version 2 offset whose upper 32 bits are not zero.
 */
function variablesList(buffer: IOBuffer, recordId: number | undefined, version: number) {
    const varList = buffer.readUint32();
    let recordStep = 0;
    if (varList === ZERO) {
        // An absent list is encoded as two zero words
        notNetcdf(
            (buffer.readUint32() !== ZERO),
            'wrong empty tag for list of variables'
        );
        // Same shape as for a populated list so that callers can read
        // `variables` and `recordStep` unconditionally
        return { variables: [], recordStep: recordStep };
    }
    notNetcdf((varList !== NC_VARIABLE), 'wrong tag for list of variables');
    // Number of variables
    const variableSize = buffer.readUint32();
    const variables = new Array(variableSize);
    for (let v = 0; v < variableSize; v++) {
        // Read name
        const name = readName(buffer);
        // Read dimensionality of the variable
        const dimensionality = buffer.readUint32();
        // Indices into the list of dimensions
        const dimensionsIds = new Array(dimensionality);
        for (let dim = 0; dim < dimensionality; dim++) {
            dimensionsIds[dim] = buffer.readUint32();
        }
        // Read the attributes of the variable
        const attributes = attributesList(buffer);
        // Read type; anything outside 1..6 is not a NetCDF type
        const type = buffer.readUint32();
        notNetcdf(((type < 1) || (type > 6)), 'non valid type ' + type);
        // Read variable size
        // The 32-bit varSize field is not large enough to contain the
        // size of variables that require more than 2^32 - 4 bytes,
        // so 2^32 - 1 is used in the varSize field for such variables.
        const varSize = buffer.readUint32();
        // Read offset; version 2 stores it as two words (upper word first)
        let offset = buffer.readUint32();
        if (version === 2) {
            notNetcdf((offset > 0), 'offsets larger than 4GB not supported');
            offset = buffer.readUint32();
        }
        // A variable is a record variable only if a record dimension exists
        // and is its first dimension. Without the explicit check a scalar
        // variable (no dimensions) in a file without record dimension would
        // match through `undefined === undefined`.
        const isRecord = recordId !== undefined && dimensionsIds[0] === recordId;
        if (isRecord) {
            recordStep += varSize;
        }
        variables[v] = {
            name: name,
            dimensions: dimensionsIds,
            attributes: attributes,
            type: num2str(type),
            size: varSize,
            offset: offset,
            record: isRecord
        };
    }
    return {
        variables: variables,
        recordStep: recordStep
    };
}
/**
 * Reads a NetCDF v3.x file
 * https://www.unidata.ucar.edu/software/netcdf/docs/file_format_specifications.html
 *
 * The header is parsed in the constructor; variable data is read from the
 * buffer on demand through `getDataVariable`.
 */
export class NetcdfReader {
    header: Partial<NetCDFHeader>;
    buffer: IOBuffer;

    /**
     * @param data Raw content of the file.
     * @throws TypeError when the data does not start with 'CDF', has a
     * version byte other than 1 or 2, or contains a malformed header.
     */
    constructor(data: ArrayBuffer) {
        const buffer = new IOBuffer(data);
        buffer.setBigEndian();

        // Validate that it's a NetCDF file
        notNetcdf((buffer.readChars(3) !== 'CDF'), 'should start with CDF');

        // Check the NetCDF format: only 1 (classic) and 2 (64-bit offset)
        // are handled, so every other value, including 0, is rejected
        const version = buffer.readByte();
        notNetcdf((version !== 1 && version !== 2), 'unknown version');

        // Read the header
        this.header = header(buffer, version);
        this.buffer = buffer;
    }

    /**
     * Version for the NetCDF format
     */
    get version() {
        if (this.header.version === 1) {
            return 'classic format';
        } else {
            return '64-bit offset format';
        }
    }

    /** Information about the record dimension. */
    get recordDimension() {
        return this.header.recordDimension;
    }

    /** List of dimensions from the header. */
    get dimensions() {
        return this.header.dimensions;
    }

    /** List of global attributes from the header. */
    get globalAttributes() {
        return this.header.globalAttributes;
    }

    /** List of variable entries from the header. */
    get variables() {
        return this.header.variables;
    }

    /**
     * Checks if a variable is available
     * @param variableName Name of the variable to check
     * @returns `true` if the header lists a variable with that name,
     * `false` otherwise (also when the header has no variable list)
     */
    hasDataVariable(variableName: string): boolean {
        return this.header.variables?.some(val => val.name === variableName) ?? false;
    }

    /**
     * Retrieves the data for a given variable
     * @param variableName Name of the variable to search or variable object
     * @returns List with the variable values
     * @throws Error when no variable with the given name exists
     */
    getDataVariable(variableName: string | NetCDFVariable) {
        let variable: NetCDFVariable | undefined;
        if (typeof variableName === 'string') {
            // search the variable
            variable = this.header.variables?.find((val) => val.name === variableName);
        } else {
            variable = variableName;
        }

        // throws if variable not found
        if (variable === undefined) throw new Error('variable not found');

        // go to the offset position
        this.buffer.seek(variable.offset);

        if (variable.record) {
            // record variable case
            return record(this.buffer, variable, this.header.recordDimension!);
        } else {
            // non-record variable case
            return nonRecord(this.buffer, variable);
        }
    }
}
|