12 std::cout <<
"\n=== Wavelet-based Chunking Demonstration ===\n";
15 std::vector<double> numeric_data = {1.0, 1.1, 1.2, 5.0, 5.1, 5.2, 2.0, 2.1, 2.2};
17 auto numeric_chunks = wavelet_numeric.
chunk(numeric_data);
20 std::string text =
"This is a test sentence. Another sentence here. And one more.";
21 std::vector<char> char_data(text.begin(), text.end());
23 auto text_chunks = wavelet_text.
chunk(char_data);
26 std::cout <<
"Numeric chunks: " << numeric_chunks.size() <<
"\n";
27 std::cout <<
"Text chunks: " << text_chunks.size() <<
"\n";
34 std::cout <<
"\n=== Mutual Information Chunking Demonstration ===\n";
37 std::vector<std::string> words = {
"the",
"quick",
"brown",
"fox",
"jumps",
38 "over",
"the",
"lazy",
"dog"};
40 auto word_chunks = mi_words.
chunk(words);
43 std::vector<uint8_t> binary_data = {0xFF, 0xFE, 0xFD, 0x00, 0x01, 0x02};
45 auto binary_chunks = mi_binary.
chunk(binary_data);
48 std::cout <<
"Word chunks: " << word_chunks.size() <<
"\n";
49 std::cout <<
"Binary chunks: " << binary_chunks.size() <<
"\n";
56 std::cout <<
"\n=== DTW-based Chunking Demonstration ===\n";
59 std::vector<float> time_series = {1.0f, 1.2f, 1.1f, 5.0f, 5.2f, 5.1f, 2.0f, 2.2f, 2.1f};
61 auto ts_chunks = dtw_numeric.
chunk(time_series);
64 std::vector<char> categorical = {
'A',
'A',
'B',
'B',
'C',
'C',
'A',
'B'};
66 auto cat_chunks = dtw_categorical.
chunk(categorical);
69 std::cout <<
"Time series chunks: " << ts_chunks.size() <<
"\n";
70 std::cout <<
"Categorical chunks: " << cat_chunks.size() <<
"\n";
Dynamic-time-warping-based (DTW) chunking for sequence alignment.
std::vector< std::vector< T > > chunk(const std::vector< T > &data) const
Chunk data based on DTW analysis.
Wavelet-based chunking strategy using signal processing principles.
std::vector< std::vector< T > > chunk(const std::vector< T > &data) const
Chunk data based on wavelet transform analysis.
void demonstrate_wavelet_chunking()
Demonstrate wavelet-based chunking with different data types.
void demonstrate_dtw_chunking()
Demonstrate DTW-based chunking.
void demonstrate_mutual_information_chunking()
Demonstrate mutual-information-based chunking.