diff --git a/.gitignore b/.gitignore index f8423d9..a9dd7ea 100644 --- a/.gitignore +++ b/.gitignore @@ -3,3 +3,4 @@ package-lock.json coverage dist *.tgz +example.parquet diff --git a/README.md b/README.md index 40d7533..b917770 100644 --- a/README.md +++ b/README.md @@ -16,9 +16,10 @@ Dependency free since 2023! ## Features - Designed to work with huge ML datasets (things like [starcoder](https://huggingface.co/datasets/bigcode/starcoderdata)) -- Loads metadata separately from data +- Can load metadata separately from data - Data can be filtered by row and column ranges - Only fetches the data needed +- Written in JavaScript, checked with TypeScript - Fast data loading for large scale ML applications - Bring data visualization closer to the user, in the browser @@ -50,7 +51,7 @@ const { parquetMetadata } = await import('hyparquet') const fs = await import('fs') const buffer = fs.readFileSync('example.parquet') -const arrayBuffer = buffer.buffer.slice(buffer.byteOffset, buffer.byteOffset + buffer.byteLength) +const arrayBuffer = new Uint8Array(buffer).buffer const metadata = parquetMetadata(arrayBuffer) ``` diff --git a/package.json b/package.json index f51c0b1..cea5a62 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "hyparquet", - "version": "0.1.6", + "version": "0.2.0", "description": "parquet file parser for javascript", "keywords": [ "parquet",