tinyllama.cpp/gguf__parser_8h_source.html

#pragma once


#include <cstddef>
#include <cstdint>
#include <fstream>
#include <map>
#include <string>
#include <vector>

#include "gguf_structs.h"


/**
 * @brief GGUF magic number that identifies the file format.
 *
 * The value 0x46554747 is the four ASCII bytes 'G' (0x47), 'G' (0x47),
 * 'U' (0x55), 'F' (0x46) packed with the first byte in the least
 * significant position, i.e. "GGUF" as a little-endian 32-bit integer.
 */
constexpr uint32_t GGUF_MAGIC{0x47u | (0x47u << 8) | (0x55u << 16) | (0x46u << 24)};


/// @name Constants for GGUF file parsing and validation
/// @{

/// Default alignment value (32) used by the GGUF parser.
constexpr uint64_t GGUF_DEFAULT_ALIGNMENT{32};
/// Upper bound on the number of tensor dimensions (4).
constexpr uint32_t GGUF_MAX_TENSOR_DIMS{4};
/// Upper bound on a GGUF string length: 2^30.
constexpr uint64_t GGUF_STRING_MAX_LENGTH{uint64_t{1} << 30};

/// @}

/// @name Constants for numeric stability in calculations
/// @{

/// Very small positive value (1e-10).
constexpr float GGUF_EPSILON{1e-10f};
/// Small positive value (1e-6).
constexpr float GGUF_SMALL_VAL{1e-6f};

/// @}

/// @name Block size constants for different quantization formats
/// @{

constexpr std::size_t GGML_QK_K{256};
constexpr std::size_t GGML_QK8_0{32};
constexpr std::size_t GGML_Q4K_BLOCK_SIZE{32};
constexpr std::size_t GGML_Q6K_BLOCK_SIZE{256};

/// @}

/// @name Constants for tensor value validation
/// @{

/// Upper limit of the validation range (+1000).
constexpr float TENSOR_SCALE_MAX{1000.0f};
/// Lower limit of the validation range (-1000), the mirror of TENSOR_SCALE_MAX.
constexpr float TENSOR_SCALE_MIN{-TENSOR_SCALE_MAX};

/// @}

/// @name Scale factors for different quantization methods
/// @{

constexpr float Q4K_SCALE_FACTOR{15.0f};
constexpr float Q6K_SCALE_FACTOR{31.0f};
constexpr float Q8K_SCALE_FACTOR{127.0f};

/// @}

/// @name Offset values for quantization methods
/// @{

constexpr int8_t Q4K_OFFSET{8};
constexpr int8_t Q6K_OFFSET{32};

/// @}

/**
 * @brief Reads raw binary data from a file stream.
 *
 * @tparam T    Type of the object that receives the data.
 * @param file  Input file stream to read from.
 * @param dest  Object that receives the data read from @p file.
 *
 * NOTE(review): only the declaration is visible in this header and the
 * definition is reported to live in gguf_parser.cpp, so callers in other
 * translation units presumably rely on explicit instantiations there;
 * confirm before using this with a new T.
 */
template <class T>
void read_raw(std::ifstream& file, T& dest);


/**
 * @brief Reads a string from a GGUF format file.
 *
 * @param file  Input file stream to read from.
 * @return The string that was read.
 *
 * Only declared here; the definition is in gguf_parser.cpp.
 */
auto read_gguf_string(std::ifstream& file) -> std::string;


/**
 * @brief Loads GGUF metadata and optionally memory-maps tensor data.
 *
 * @param filename  Name of the GGUF file to load.
 * @param use_mmap  Presumably selects whether tensor data is memory-mapped;
 *                  verify against the definition in gguf_parser.cpp.
 * @return A GGUFData object (declared in gguf_structs.h) holding the
 *         contents of the file.
 */
GGUFData load_gguf_meta(std::string const& filename,
                        bool use_mmap);

GGUF_MAGIC
constexpr uint32_t GGUF_MAGIC
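GGUF magic number that identifies the file format. Spells "GGUF" in ASCII: the bytes 0x47 0x47 0x55 0x46 in file order, which is the value 0x46554747 when read as a little-endian 32-bit integer.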
Definition gguf_parser.h:24

TENSOR_SCALE_MAX
constexpr float TENSOR_SCALE_MAX
Constants for tensor value validation.
Definition gguf_parser.h:50

Q4K_OFFSET
constexpr int8_t Q4K_OFFSET
Offset values for quantization methods.
Definition gguf_parser.h:63

Q6K_OFFSET
constexpr int8_t Q6K_OFFSET
Definition gguf_parser.h:64

GGML_Q4K_BLOCK_SIZE
constexpr size_t GGML_Q4K_BLOCK_SIZE
Definition gguf_parser.h:44

Q8K_SCALE_FACTOR
constexpr float Q8K_SCALE_FACTOR
Definition gguf_parser.h:58

GGML_Q6K_BLOCK_SIZE
constexpr size_t GGML_Q6K_BLOCK_SIZE
Definition gguf_parser.h:45

Q4K_SCALE_FACTOR
constexpr float Q4K_SCALE_FACTOR
Scale factors for different quantization methods.
Definition gguf_parser.h:56

read_raw
void read_raw(std::ifstream &file, T &dest)
Reads raw binary data from a file stream.
Definition gguf_parser.cpp:62

GGUF_MAX_TENSOR_DIMS
constexpr uint32_t GGUF_MAX_TENSOR_DIMS
Definition gguf_parser.h:30

TENSOR_SCALE_MIN
constexpr float TENSOR_SCALE_MIN
Definition gguf_parser.h:51

Q6K_SCALE_FACTOR
constexpr float Q6K_SCALE_FACTOR
Definition gguf_parser.h:57

GGUF_EPSILON
constexpr float GGUF_EPSILON
Constants for numeric stability in calculations.
Definition gguf_parser.h:36

GGUF_STRING_MAX_LENGTH
constexpr uint64_t GGUF_STRING_MAX_LENGTH
Definition gguf_parser.h:31

GGML_QK8_0
constexpr size_t GGML_QK8_0
Definition gguf_parser.h:43

GGML_QK_K
constexpr size_t GGML_QK_K
Block size constants for different quantization formats.
Definition gguf_parser.h:42

GGUF_SMALL_VAL
constexpr float GGUF_SMALL_VAL
Definition gguf_parser.h:37

GGUF_DEFAULT_ALIGNMENT
constexpr uint64_t GGUF_DEFAULT_ALIGNMENT
Constants for GGUF file parsing and validation.
Definition gguf_parser.h:29

load_gguf_meta
GGUFData load_gguf_meta(const std::string &filename, bool use_mmap)
Loads GGUF metadata and optionally memory-maps tensor data.
Definition gguf_parser.cpp:123

read_gguf_string
std::string read_gguf_string(std::ifstream &file)
Reads a string from a GGUF format file.
Definition gguf_parser.cpp:82

gguf_structs.h
Data structures for GGUF (GPT-Generated Unified Format) file format.

GGUFData
Complete representation of a GGUF file's contents.
Definition gguf_structs.h:80