blob: a5a535db6e6ac4c24e63a34b905cf45d220e9b9b [file] [log] [blame]
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// Command arrow-ls displays the listing of an Arrow file.
//
// Examples:
//
// $> arrow-ls ./testdata/primitives.data
// version: V4
// schema:
// fields: 11
// - bools: type=bool, nullable
// - int8s: type=int8, nullable
// - int16s: type=int16, nullable
// - int32s: type=int32, nullable
// - int64s: type=int64, nullable
// - uint8s: type=uint8, nullable
// - uint16s: type=uint16, nullable
// - uint32s: type=uint32, nullable
// - uint64s: type=uint64, nullable
// - float32s: type=float32, nullable
// - float64s: type=float64, nullable
// records: 3
//
// $> gen-arrow-stream | arrow-ls
// schema:
// fields: 11
// - bools: type=bool, nullable
// - int8s: type=int8, nullable
// - int16s: type=int16, nullable
// - int32s: type=int32, nullable
// - int64s: type=int64, nullable
// - uint8s: type=uint8, nullable
// - uint16s: type=uint16, nullable
// - uint32s: type=uint32, nullable
// - uint64s: type=uint64, nullable
// - float32s: type=float32, nullable
// - float64s: type=float64, nullable
// records: 3
package main // import "github.com/apache/arrow/go/v6/arrow/ipc/cmd/arrow-ls"
import (
"bytes"
"flag"
"fmt"
"io"
"log"
"os"
"github.com/apache/arrow/go/v6/arrow/ipc"
"github.com/apache/arrow/go/v6/arrow/memory"
"golang.org/x/xerrors"
)
func main() {
log.SetPrefix("arrow-ls: ")
log.SetFlags(0)
flag.Parse()
var err error
switch flag.NArg() {
case 0:
err = processStream(os.Stdout, os.Stdin)
default:
err = processFiles(os.Stdout, flag.Args())
}
if err != nil {
log.Fatal(err)
}
}
func processStream(w io.Writer, rin io.Reader) error {
mem := memory.NewGoAllocator()
for {
r, err := ipc.NewReader(rin, ipc.WithAllocator(mem))
if err != nil {
if xerrors.Is(err, io.EOF) {
return nil
}
return err
}
fmt.Fprintf(w, "%v\n", r.Schema())
nrecs := 0
for r.Next() {
nrecs++
}
fmt.Fprintf(w, "records: %d\n", nrecs)
r.Release()
}
return nil
}
func processFiles(w io.Writer, names []string) error {
for _, name := range names {
err := processFile(w, name)
if err != nil {
return err
}
}
return nil
}
func processFile(w io.Writer, fname string) error {
f, err := os.Open(fname)
if err != nil {
return err
}
defer f.Close()
hdr := make([]byte, len(ipc.Magic))
_, err = io.ReadFull(f, hdr)
if err != nil {
return xerrors.Errorf("could not read file header: %w", err)
}
f.Seek(0, io.SeekStart)
if !bytes.Equal(hdr, ipc.Magic) {
// try as a stream.
return processStream(w, f)
}
mem := memory.NewGoAllocator()
r, err := ipc.NewFileReader(f, ipc.WithAllocator(mem))
if err != nil {
if xerrors.Is(err, io.EOF) {
return nil
}
return err
}
defer r.Close()
fmt.Fprintf(w, "version: %v\n", r.Version())
fmt.Fprintf(w, "%v\n", r.Schema())
fmt.Fprintf(w, "records: %d\n", r.NumRecords())
return nil
}
func init() {
flag.Usage = func() {
fmt.Fprintf(os.Stderr, `Command arrow-ls displays the listing of an Arrow file.
Usage: arrow-ls [OPTIONS] [FILE1 [FILE2 [...]]]
Examples:
$> arrow-ls ./testdata/primitives.data
version: V4
schema:
fields: 11
- bools: type=bool, nullable
- int8s: type=int8, nullable
- int16s: type=int16, nullable
- int32s: type=int32, nullable
- int64s: type=int64, nullable
- uint8s: type=uint8, nullable
- uint16s: type=uint16, nullable
- uint32s: type=uint32, nullable
- uint64s: type=uint64, nullable
- float32s: type=float32, nullable
- float64s: type=float64, nullable
records: 3
$> gen-arrow-stream | arrow-ls
schema:
fields: 11
- bools: type=bool, nullable
- int8s: type=int8, nullable
- int16s: type=int16, nullable
- int32s: type=int32, nullable
- int64s: type=int64, nullable
- uint8s: type=uint8, nullable
- uint16s: type=uint16, nullable
- uint32s: type=uint32, nullable
- uint64s: type=uint64, nullable
- float32s: type=float32, nullable
- float64s: type=float64, nullable
records: 3
`)
os.Exit(0)
}
}