ocf

package
v2.21.0 Latest Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Apr 23, 2024 License: MIT Imports: 13 Imported by: 8

Documentation

Overview

Package ocf implements encoding and decoding of Avro Object Container Files as defined by the Avro specification.

See the Avro specification for an understanding of Avro: http://avro.apache.org/docs/current/

Index

Examples

Constants

This section is empty.

Variables

View Source
// HeaderSchema is the Avro schema of a container file header: a record named
// org.apache.avro.file.Header with a 4-byte fixed "magic" field, a "meta" map
// whose values are bytes, and a 16-byte fixed "sync" field.
var HeaderSchema = avro.MustParse(`{
	"type": "record", 
	"name": "org.apache.avro.file.Header",
	"fields": [
		{"name": "magic", "type": {"type": "fixed", "name": "Magic", "size": 4}},
		{"name": "meta", "type": {"type": "map", "values": "bytes"}},
		{"name": "sync", "type": {"type": "fixed", "name": "Sync", "size": 16}}
	]
}`)

HeaderSchema is the Avro schema of a container file header.

Functions

This section is empty.

Types

type Codec

// Codec represents a compression codec. An implementation transforms one byte
// slice into another in each direction.
type Codec interface {
	// Decode decodes the given bytes. It returns the decoded bytes and an error.
	Decode([]byte) ([]byte, error)
	// Encode encodes the given bytes. Unlike Decode, it has no error result.
	Encode([]byte) []byte
}

Codec represents a compression codec.

type CodecName

type CodecName string

CodecName represents a compression codec name.

// Supported compression codecs. The value of each constant is the codec's
// name as a string.
const (
	Null      CodecName = "null"
	Deflate   CodecName = "deflate"
	Snappy    CodecName = "snappy"
	ZStandard CodecName = "zstandard"
)

Supported compression codecs.

type Decoder

type Decoder struct {
	// contains filtered or unexported fields
}

Decoder reads and decodes Avro values from a container file.

func NewDecoder

func NewDecoder(r io.Reader) (*Decoder, error)

NewDecoder returns a new decoder that reads from reader r.

Example
package main

import (
	"log"
	"os"

	"github.com/hamba/avro/v2/ocf"
)

// main demonstrates reading every record of an Avro Object Container File
// with an ocf.Decoder.
func main() {
	// SimpleRecord is the Go shape of the records being read; the avro tags
	// bind each struct field to the schema field of the same name.
	type SimpleRecord struct {
		A int64  `avro:"a"`
		B string `avro:"b"`
	}

	f, err := os.Open("/your/avro/file.avro")
	if err != nil {
		log.Fatal(err)
	}
	defer f.Close()

	dec, err := ocf.NewDecoder(f)
	if err != nil {
		log.Fatal(err)
	}

	for dec.HasNext() {
		var record SimpleRecord
		if err := dec.Decode(&record); err != nil {
			log.Fatal(err)
		}

		// Do something with the data
	}

	// Report the decoder's own error. The outer err is always nil at this
	// point (every earlier failure exits via log.Fatal), so logging it would
	// print "<nil>" and hide the real cause.
	if err := dec.Error(); err != nil {
		log.Fatal(err)
	}
}
Output:

func (*Decoder) Decode

func (d *Decoder) Decode(v any) error

Decode reads the next Avro encoded value from its input and stores it in the value pointed to by v.

func (*Decoder) Error

func (d *Decoder) Error() error

Error returns the last reader error.

func (*Decoder) HasNext

func (d *Decoder) HasNext() bool

HasNext determines if there is another value to read.

func (*Decoder) Metadata

func (d *Decoder) Metadata() map[string][]byte

Metadata returns the header metadata.

type DeflateCodec

type DeflateCodec struct {
	// contains filtered or unexported fields
}

DeflateCodec is a flate compression codec.

func (*DeflateCodec) Decode

func (c *DeflateCodec) Decode(b []byte) ([]byte, error)

Decode decodes the given bytes.

func (*DeflateCodec) Encode

func (c *DeflateCodec) Encode(b []byte) []byte

Encode encodes the given bytes.

type Encoder

type Encoder struct {
	// contains filtered or unexported fields
}

Encoder writes an Avro container file to an output stream.

func NewEncoder

func NewEncoder(s string, w io.Writer, opts ...EncoderFunc) (*Encoder, error)

NewEncoder returns a new encoder that writes to w using schema s.

If the writer is an existing ocf file, it will append data using the existing schema.

Example
package main

import (
	"log"
	"os"

	"github.com/hamba/avro/v2/ocf"
)

// main demonstrates writing a record to an Avro Object Container File with an
// ocf.Encoder.
func main() {
	// schema is the Avro schema the encoder writes records with.
	schema := `{
	    "type": "record",
	    "name": "simple",
	    "namespace": "org.hamba.avro",
	    "fields" : [
	        {"name": "a", "type": "long"},
	        {"name": "b", "type": "string"}
	    ]
	}`

	// SimpleRecord is the Go shape of the records being written; the avro
	// tags bind each struct field to the schema field of the same name.
	type SimpleRecord struct {
		A int64  `avro:"a"`
		B string `avro:"b"`
	}

	// Open the file read-write, creating it if needed. os.Open would return a
	// read-only file, so every write made through the encoder would fail.
	f, err := os.OpenFile("/your/avro/file.avro", os.O_RDWR|os.O_CREATE, 0o644)
	if err != nil {
		log.Fatal(err)
	}
	defer f.Close()

	enc, err := ocf.NewEncoder(schema, f)
	if err != nil {
		log.Fatal(err)
	}

	var record SimpleRecord
	if err := enc.Encode(record); err != nil {
		log.Fatal(err)
	}

	// Flush pushes buffered data to the file.
	if err := enc.Flush(); err != nil {
		log.Fatal(err)
	}

	// Sync commits the file's contents to stable storage.
	if err := f.Sync(); err != nil {
		log.Fatal(err)
	}
}
Output:

func (*Encoder) Close

func (e *Encoder) Close() error

Close closes the encoder, flushing the writer.

func (*Encoder) Encode

func (e *Encoder) Encode(v any) error

Encode writes the Avro encoding of v to the stream.

func (*Encoder) Flush

func (e *Encoder) Flush() error

Flush flushes the underlying writer.

func (*Encoder) Write

func (e *Encoder) Write(p []byte) (n int, err error)

Write writes p to the internal buffer. This method skips the internal encoder, so the caller is responsible for encoding the bytes. No error is returned if the bytes do not conform to the schema given to NewEncoder, but the final ocf data will be corrupted.

type EncoderFunc

type EncoderFunc func(cfg *encoderConfig)

EncoderFunc represents a configuration function for Encoder.

func WithBlockLength

func WithBlockLength(length int) EncoderFunc

WithBlockLength sets the block length on the encoder.

func WithCodec

func WithCodec(codec CodecName) EncoderFunc

WithCodec sets the compression codec on the encoder.

func WithCompressionLevel

func WithCompressionLevel(compLvl int) EncoderFunc

WithCompressionLevel sets the compression codec to deflate and the compression level on the encoder.

func WithEncodingConfig added in v2.11.0

func WithEncodingConfig(wCfg avro.API) EncoderFunc

WithEncodingConfig sets the value encoder config on the OCF encoder.

func WithMetadata

func WithMetadata(meta map[string][]byte) EncoderFunc

WithMetadata sets the metadata on the encoder header.

func WithSyncBlock added in v2.2.0

func WithSyncBlock(sync [16]byte) EncoderFunc

WithSyncBlock sets the sync block.

// Header represents an Avro container file header. Its avro tags map the
// fields to the "magic", "meta" and "sync" fields of a header record.
type Header struct {
	Magic [4]byte           `avro:"magic"` // 4-byte magic value
	Meta  map[string][]byte `avro:"meta"`  // header metadata, keyed by name
	Sync  [16]byte          `avro:"sync"`  // 16-byte sync value
}

Header represents an Avro container file header.

type NullCodec

type NullCodec struct{}

NullCodec is a no-op codec.

func (*NullCodec) Decode

func (*NullCodec) Decode(b []byte) ([]byte, error)

Decode decodes the given bytes.

func (*NullCodec) Encode

func (*NullCodec) Encode(b []byte) []byte

Encode encodes the given bytes.

type SnappyCodec

type SnappyCodec struct{}

SnappyCodec is a snappy compression codec.

func (*SnappyCodec) Decode

func (*SnappyCodec) Decode(b []byte) ([]byte, error)

Decode decodes the given bytes.

func (*SnappyCodec) Encode

func (*SnappyCodec) Encode(b []byte) []byte

Encode encodes the given bytes.

type ZStandardCodec added in v2.19.0

type ZStandardCodec struct{}

ZStandardCodec is a zstandard compression codec.

func (*ZStandardCodec) Decode added in v2.19.0

func (*ZStandardCodec) Decode(b []byte) ([]byte, error)

Decode decodes the given bytes.

func (*ZStandardCodec) Encode added in v2.19.0

func (*ZStandardCodec) Encode(b []byte) []byte

Encode encodes the given bytes.

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL