|
| 1 | +// Licensed to the Apache Software Foundation (ASF) under one |
| 2 | +// or more contributor license agreements. See the NOTICE file |
| 3 | +// distributed with this work for additional information |
| 4 | +// regarding copyright ownership. The ASF licenses this file |
| 5 | +// to you under the Apache License, Version 2.0 (the |
| 6 | +// "License"); you may not use this file except in compliance |
| 7 | +// with the License. You may obtain a copy of the License at |
| 8 | +// |
| 9 | +// http://www.apache.org/licenses/LICENSE-2.0 |
| 10 | +// |
| 11 | +// Unless required by applicable law or agreed to in writing, software |
| 12 | +// distributed under the License is distributed on an "AS IS" BASIS, |
| 13 | +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 14 | +// See the License for the specific language governing permissions and |
| 15 | +// limitations under the License. |
| 16 | + |
| 17 | +// Package parquet provides an implementation of Apache Parquet for Go. |
| 18 | +// |
| 19 | +// Apache Parquet is an open-source columnar data storage format using the record |
| 20 | +// shredding and assembly algorithm to accomodate complex data structures which |
| 21 | +// can then be used to efficiently store the data. |
| 22 | +// |
| 23 | +// This implementation is a native go implementation for reading and writing the |
| 24 | +// parquet file format. |
| 25 | +// |
| 26 | +// Install |
| 27 | +// |
| 28 | +// You can download the library via: |
| 29 | +// go get -u github.com/apache/arrow/go/parquet |
| 30 | +// |
| 31 | +// In addition, two cli utilities are provided: |
| 32 | +// go install github.factset.com/mtopol/parquet-go/cmd/parquet_reader |
| 33 | +// go install github.factset.com/mtopol/parquet-go/cmd/parquet_schema |
| 34 | +// |
| 35 | +// Modules |
| 36 | +// |
| 37 | +// This top level parquet package contains the basic common types and reader/writer |
| 38 | +// properties along with some utilities that are used throughout the other modules. |
| 39 | +// |
| 40 | +// The file module contains the functions for directly reading/writing parquet files |
| 41 | +// including Column Readers and Column Writers. |
| 42 | +// |
| 43 | +// The metadata module contains the types for managing the lower level file/rowgroup/column |
| 44 | +// metadata inside of a ParquetFile including inspecting the statistics. |
| 45 | +// |
| 46 | +// The pqarrow module contains helper functions and types for converting directly |
| 47 | +// between Parquet and Apache Arrow formats. |
| 48 | +// |
| 49 | +// The schema module contains the types for manipulating / inspecting / creating |
| 50 | +// parquet file schemas. |
| 51 | +// |
| 52 | +// Primitive Types |
| 53 | +// |
| 54 | +// The Parquet Primitive Types and their corresponding Go types are Boolean (bool), |
| 55 | +// Int32 (int32), Int64 (int64), Int96 (parquet.Int96), Float (float32), Double (float64), |
| 56 | +// ByteArray (parquet.ByteArray) and FixedLenByteArray (parquet.FixedLenByteArray). |
| 57 | +// |
| 58 | +// Encodings |
| 59 | +// |
| 60 | +// The encoding types supported in this package are: |
| 61 | +// Plain, Plain/RLE Dictionary, Delta Binary Packed (only integer types), Delta Byte Array |
| 62 | +// (only ByteArray), Delta Length Byte Array (only ByteArray) |
| 63 | +// |
| 64 | +// Tip: Some platforms don't necessarily support all kinds of encodings. If you're not |
| 65 | +// sure what to use, just use Plain and Dictionary encoding. |
| 66 | +package parquet |
| 67 | + |
| 68 | +//go:generate thrift -o internal -r --gen go ../../cpp/src/parquet/parquet.thrift |
0 commit comments