import { parquetMetadata, toJson } from './src/hyparquet.js'
const dropzone = document.getElementById('dropzone')
const layout = document.getElementById('layout')
const metadata = document.getElementById('metadata')
const fileInput = document.getElementById('file-input')
dropzone.addEventListener('dragover', e => {
e.preventDefault()
e.dataTransfer.dropEffect = 'copy'
dropzone.classList.add('over')
})
dropzone.addEventListener('dragleave', () => {
dropzone.classList.remove('over')
})
dropzone.addEventListener('drop', e => {
e.preventDefault() // prevent dropped file from being "downloaded"
dropzone.classList.remove('over')
const { files, items } = e.dataTransfer
if (files.length > 0) {
const file = files[0]
processFile(file)
}
if (items.length > 0) {
const item = items[0]
if (item.kind === 'string') {
item.getAsString(str => {
if (str.startsWith('https')) {
processUrl(str)
}
})
}
}
})
function processUrl(url) {
fetch(url)
.then(response => response.arrayBuffer())
.then(arrayBuffer => renderSidebar(arrayBuffer, url))
.catch(e => {
dropzone.innerHTML = `${url}`
dropzone.innerHTML += `
Error fetching file\n${e}
`
})
}
function processFile(file) {
const reader = new FileReader()
reader.onload = e => {
try {
const arrayBuffer = e.target.result
renderSidebar(arrayBuffer, file.name)
} catch (e) {
dropzone.innerHTML = `${file.name}`
dropzone.innerHTML += `Error parsing file\n${e}
`
}
}
reader.onerror = e => {
console.error('Error reading file', e)
dropzone.innerText = `Error reading file\n${e.target.error}`
}
reader.readAsArrayBuffer(file)
}
function renderSidebar(asyncBuffer, name) {
layout.innerHTML = `${name}`
// render file layout
layout.appendChild(fileLayout(metadata, asyncBuffer))
// display metadata
metadata.innerHTML = ''
metadata.appendChild(fileMetadata(toJson(parquetMetadata(asyncBuffer))))
}
dropzone.addEventListener('click', () => {
fileInput.click()
})
fileInput.addEventListener('change', () => {
if (fileInput.files.length > 0) {
processFile(fileInput.files[0])
}
})
// Render file layout
function fileLayout(metadata, arrayBuffer) {
let html = 'File layout
'
html += cell('PAR1', 0, 4, 4) // magic number
for (const rowGroupIndex in metadata.row_groups) {
const rowGroup = metadata.row_groups[rowGroupIndex]
html += group(`Row group ${rowGroupIndex} (${rowGroup.total_byte_size} bytes)`)
for (const column of rowGroup.columns) {
const columnName = column.meta_data.path_in_schema.join('.')
let columnOffset = column.meta_data.dictionary_page_offset
if (!columnOffset || column.meta_data.data_page_offset < columnOffset) {
columnOffset = column.meta_data.data_page_offset
}
columnOffset = Number(columnOffset)
const bytes = column.meta_data.total_compressed_size
const end = columnOffset + bytes
html += cell(`Column ${columnName}`, columnOffset, bytes, end)
}
html += ''
}
const metadataStart = arrayBuffer.byteLength - metadata.metadata_length - 4
html += cell('Metadata', metadataStart, metadata.metadata_length, arrayBuffer.byteLength - 4)
html += cell('PAR1', arrayBuffer.byteLength - 4, 4, arrayBuffer.byteLength) // magic number
const div = document.createElement('div')
div.innerHTML = html
div.classList.add('collapsed') // start collapsed
div.children[0].addEventListener('click', () => {
div.classList.toggle('collapsed')
})
return div
}
function group(name) {
return `${name}`
}
function cell(name, start, bytes, end) {
return `
- start ${start}
- bytes ${bytes}
- end ${end}
`
}
// Render metadata
function fileMetadata(metadata) {
let html = '
Metadata
'
html += `
${JSON.stringify(metadata, null, 2)}`
const div = document.createElement('div')
div.innerHTML = html
div.classList.add('collapsed') // start collapsed
div.children[0].addEventListener('click', () => {
div.classList.toggle('collapsed')
})
return div
}