libvroom

libvroom

Functions

Name
AlignedBuffer transcode_windows1252_to_utf8(const uint8_t * data, size_t size)
AlignedBuffer transcode_to_utf8(const uint8_t * data, size_t size, CharEncoding enc, size_t bom_length)
std::vector< std::string > simd_supported_targets()
std::string simd_best_target()
AlignedBuffer read_stdin_to_ptr(size_t padding)
std::shared_ptr< Table > read_csv_to_table(const std::string & path, const CsvOptions & opts)
CharEncoding parse_encoding_name(std::string_view name)
AlignedBuffer load_file_to_ptr(const std::string & filename, size_t padding)
bool has_windows1252_bytes(const uint8_t * data, size_t size)
const char * error_severity_to_string(ErrorSeverity severity)
const char * error_mode_to_string(ErrorMode mode)
const char * error_code_to_string(ErrorCode code)
const char * encoding_to_string(CharEncoding enc)
size_t encode_utf8(uint32_t cp, uint8_t * out)
int detect_escape_pattern(const uint8_t * buf, size_t len, char quote_char, char escape_char)
EncodingResult detect_encoding(const uint8_t * data, size_t size)
ConversionResult convert_csv_to_parquet(const VroomOptions & options, ProgressCallback progress)

Attributes

Name
const uint32_t[32] windows1252_to_unicode
constexpr double ESCAPE_PATTERN_MATCH_BOOST
Score boost for dialects matching detected escape patterns (e.g., \" or ""). Applied when there’s a clear escape pattern signal in the data.
constexpr double DOUBLE_QUOTE_ESCAPE_BOOST
Smaller boost for double-quote escaping when explicitly detected. Used to slightly prefer RFC 4180 style when evidence is present.

Functions Documentation

function transcode_windows1252_to_utf8

static AlignedBuffer transcode_windows1252_to_utf8(
    const uint8_t * data,
    size_t size
)

function transcode_to_utf8

AlignedBuffer transcode_to_utf8(
    const uint8_t * data,
    size_t size,
    CharEncoding enc,
    size_t bom_length
)

function simd_supported_targets

std::vector< std::string > simd_supported_targets()

function simd_best_target

std::string simd_best_target()

function read_stdin_to_ptr

AlignedBuffer read_stdin_to_ptr(
    size_t padding
)

function read_csv_to_table

std::shared_ptr< Table > read_csv_to_table(
    const std::string & path,
    const CsvOptions & opts
)

function parse_encoding_name

CharEncoding parse_encoding_name(
    std::string_view name
)

function load_file_to_ptr

AlignedBuffer load_file_to_ptr(
    const std::string & filename,
    size_t padding
)

function has_windows1252_bytes

static bool has_windows1252_bytes(
    const uint8_t * data,
    size_t size
)

function error_severity_to_string

const char * error_severity_to_string(
    ErrorSeverity severity
)

function error_mode_to_string

const char * error_mode_to_string(
    ErrorMode mode
)

function error_code_to_string

const char * error_code_to_string(
    ErrorCode code
)

function encoding_to_string

const char * encoding_to_string(
    CharEncoding enc
)

function encode_utf8

static size_t encode_utf8(
    uint32_t cp,
    uint8_t * out
)

function detect_escape_pattern

static int detect_escape_pattern(
    const uint8_t * buf,
    size_t len,
    char quote_char,
    char escape_char
)

function detect_encoding

EncodingResult detect_encoding(
    const uint8_t * data,
    size_t size
)

function convert_csv_to_parquet

ConversionResult convert_csv_to_parquet(
    const VroomOptions & options,
    ProgressCallback progress
)

Attributes Documentation

variable windows1252_to_unicode

static const uint32_t windows1252_to_unicode[32];

variable ESCAPE_PATTERN_MATCH_BOOST

constexpr double ESCAPE_PATTERN_MATCH_BOOST = 1.2;

Score boost for dialects matching detected escape patterns (e.g., \" or ""). Applied when there’s a clear escape pattern signal in the data.

variable DOUBLE_QUOTE_ESCAPE_BOOST

constexpr double DOUBLE_QUOTE_ESCAPE_BOOST = 1.1;

Smaller boost for double-quote escaping when explicitly detected. Used to slightly prefer RFC 4180 style when evidence is present.


Updated on 2026-02-16 at 19:19:38 +0000