1 /////////////////////////////////////////////////////////////////////////////// 2 // 3 /// \file stream_encoder.c 4 /// \brief Encodes .xz Streams 5 // 6 // Author: Lasse Collin 7 // 8 // This file has been put into the public domain. 9 // You can do whatever you want with this file. 10 // 11 /////////////////////////////////////////////////////////////////////////////// 12 13 #include "block_encoder.h" 14 #include "index_encoder.h" 15 16 17 typedef struct { 18 enum { 19 SEQ_STREAM_HEADER, 20 SEQ_BLOCK_INIT, 21 SEQ_BLOCK_HEADER, 22 SEQ_BLOCK_ENCODE, 23 SEQ_INDEX_ENCODE, 24 SEQ_STREAM_FOOTER, 25 } sequence; 26 27 /// True if Block encoder has been initialized by 28 /// stream_encoder_init() or stream_encoder_update() 29 /// and thus doesn't need to be initialized in stream_encode(). 30 bool block_encoder_is_initialized; 31 32 /// Block 33 lzma_next_coder block_encoder; 34 35 /// Options for the Block encoder 36 lzma_block block_options; 37 38 /// The filter chain currently in use 39 lzma_filter filters[LZMA_FILTERS_MAX + 1]; 40 41 /// Index encoder. This is separate from Block encoder, because this 42 /// doesn't take much memory, and when encoding multiple Streams 43 /// with the same encoding options we avoid reallocating memory. 44 lzma_next_coder index_encoder; 45 46 /// Index to hold sizes of the Blocks 47 lzma_index *index; 48 49 /// Read position in buffer[] 50 size_t buffer_pos; 51 52 /// Total number of bytes in buffer[] 53 size_t buffer_size; 54 55 /// Buffer to hold Stream Header, Block Header, and Stream Footer. 56 /// Block Header has biggest maximum size. 57 uint8_t buffer[LZMA_BLOCK_HEADER_SIZE_MAX]; 58 } lzma_stream_coder; 59 60 61 static lzma_ret 62 block_encoder_init(lzma_stream_coder *coder, const lzma_allocator *allocator) 63 { 64 // Prepare the Block options. Even though Block encoder doesn't need 65 // compressed_size, uncompressed_size, and header_size to be 66 // initialized, it is a good idea to do it here, because this way 67 // we catch if someone gave us Filter ID that cannot be used in 68 // Blocks/Streams. 69 coder->block_options.compressed_size = LZMA_VLI_UNKNOWN; 70 coder->block_options.uncompressed_size = LZMA_VLI_UNKNOWN; 71 72 return_if_error(lzma_block_header_size(&coder->block_options)); 73 74 // Initialize the actual Block encoder. 75 return lzma_block_encoder_init(&coder->block_encoder, allocator, 76 &coder->block_options); 77 } 78 79 80 static lzma_ret 81 stream_encode(void *coder_ptr, const lzma_allocator *allocator, 82 const uint8_t *restrict in, size_t *restrict in_pos, 83 size_t in_size, uint8_t *restrict out, 84 size_t *restrict out_pos, size_t out_size, lzma_action action) 85 { 86 lzma_stream_coder *coder = coder_ptr; 87 88 // Main loop 89 while (*out_pos < out_size) 90 switch (coder->sequence) { 91 case SEQ_STREAM_HEADER: 92 case SEQ_BLOCK_HEADER: 93 case SEQ_STREAM_FOOTER: 94 lzma_bufcpy(coder->buffer, &coder->buffer_pos, 95 coder->buffer_size, out, out_pos, out_size); 96 if (coder->buffer_pos < coder->buffer_size) 97 return LZMA_OK; 98 99 if (coder->sequence == SEQ_STREAM_FOOTER) 100 return LZMA_STREAM_END; 101 102 coder->buffer_pos = 0; 103 ++coder->sequence; 104 break; 105 106 case SEQ_BLOCK_INIT: { 107 if (*in_pos == in_size) { 108 // If we are requested to flush or finish the current 109 // Block, return LZMA_STREAM_END immediately since 110 // there's nothing to do. 111 if (action != LZMA_FINISH) 112 return action == LZMA_RUN 113 ? LZMA_OK : LZMA_STREAM_END; 114 115 // The application had used LZMA_FULL_FLUSH to finish 116 // the previous Block, but now wants to finish without 117 // encoding new data, or it is simply creating an 118 // empty Stream with no Blocks. 119 // 120 // Initialize the Index encoder, and continue to 121 // actually encoding the Index. 122 return_if_error(lzma_index_encoder_init( 123 &coder->index_encoder, allocator, 124 coder->index)); 125 coder->sequence = SEQ_INDEX_ENCODE; 126 break; 127 } 128 129 // Initialize the Block encoder unless it was already 130 // initialized by stream_encoder_init() or 131 // stream_encoder_update(). 132 if (!coder->block_encoder_is_initialized) 133 return_if_error(block_encoder_init(coder, allocator)); 134 135 // Make it false so that we don't skip the initialization 136 // with the next Block. 137 coder->block_encoder_is_initialized = false; 138 139 // Encode the Block Header. This shouldn't fail since we have 140 // already initialized the Block encoder. 141 if (lzma_block_header_encode(&coder->block_options, 142 coder->buffer) != LZMA_OK) 143 return LZMA_PROG_ERROR; 144 145 coder->buffer_size = coder->block_options.header_size; 146 coder->sequence = SEQ_BLOCK_HEADER; 147 break; 148 } 149 150 case SEQ_BLOCK_ENCODE: { 151 static const lzma_action convert[LZMA_ACTION_MAX + 1] = { 152 LZMA_RUN, 153 LZMA_SYNC_FLUSH, 154 LZMA_FINISH, 155 LZMA_FINISH, 156 LZMA_FINISH, 157 }; 158 159 const lzma_ret ret = coder->block_encoder.code( 160 coder->block_encoder.coder, allocator, 161 in, in_pos, in_size, 162 out, out_pos, out_size, convert[action]); 163 if (ret != LZMA_STREAM_END || action == LZMA_SYNC_FLUSH) 164 return ret; 165 166 // Add a new Index Record. 167 const lzma_vli unpadded_size = lzma_block_unpadded_size( 168 &coder->block_options); 169 assert(unpadded_size != 0); 170 return_if_error(lzma_index_append(coder->index, allocator, 171 unpadded_size, 172 coder->block_options.uncompressed_size)); 173 174 coder->sequence = SEQ_BLOCK_INIT; 175 break; 176 } 177 178 case SEQ_INDEX_ENCODE: { 179 // Call the Index encoder. It doesn't take any input, so 180 // those pointers can be NULL. 181 const lzma_ret ret = coder->index_encoder.code( 182 coder->index_encoder.coder, allocator, 183 NULL, NULL, 0, 184 out, out_pos, out_size, LZMA_RUN); 185 if (ret != LZMA_STREAM_END) 186 return ret; 187 188 // Encode the Stream Footer into coder->buffer. 189 const lzma_stream_flags stream_flags = { 190 .version = 0, 191 .backward_size = lzma_index_size(coder->index), 192 .check = coder->block_options.check, 193 }; 194 195 if (lzma_stream_footer_encode(&stream_flags, coder->buffer) 196 != LZMA_OK) 197 return LZMA_PROG_ERROR; 198 199 coder->buffer_size = LZMA_STREAM_HEADER_SIZE; 200 coder->sequence = SEQ_STREAM_FOOTER; 201 break; 202 } 203 204 default: 205 assert(0); 206 return LZMA_PROG_ERROR; 207 } 208 209 return LZMA_OK; 210 } 211 212 213 static void 214 stream_encoder_end(void *coder_ptr, const lzma_allocator *allocator) 215 { 216 lzma_stream_coder *coder = coder_ptr; 217 218 lzma_next_end(&coder->block_encoder, allocator); 219 lzma_next_end(&coder->index_encoder, allocator); 220 lzma_index_end(coder->index, allocator); 221 222 for (size_t i = 0; coder->filters[i].id != LZMA_VLI_UNKNOWN; ++i) 223 lzma_free(coder->filters[i].options, allocator); 224 225 lzma_free(coder, allocator); 226 return; 227 } 228 229 230 static lzma_ret 231 stream_encoder_update(void *coder_ptr, const lzma_allocator *allocator, 232 const lzma_filter *filters, 233 const lzma_filter *reversed_filters) 234 { 235 lzma_stream_coder *coder = coder_ptr; 236 lzma_ret ret; 237 238 // Make a copy to a temporary buffer first. This way it is easier 239 // to keep the encoder state unchanged if an error occurs with 240 // lzma_filters_copy(). 241 lzma_filter temp[LZMA_FILTERS_MAX + 1]; 242 return_if_error(lzma_filters_copy(filters, temp, allocator)); 243 244 if (coder->sequence <= SEQ_BLOCK_INIT) { 245 // There is no incomplete Block waiting to be finished, 246 // thus we can change the whole filter chain. Start by 247 // trying to initialize the Block encoder with the new 248 // chain. This way we detect if the chain is valid. 249 coder->block_encoder_is_initialized = false; 250 coder->block_options.filters = temp; 251 ret = block_encoder_init(coder, allocator); 252 coder->block_options.filters = coder->filters; 253 if (ret != LZMA_OK) 254 goto error; 255 256 coder->block_encoder_is_initialized = true; 257 258 } else if (coder->sequence <= SEQ_BLOCK_ENCODE) { 259 // We are in the middle of a Block. Try to update only 260 // the filter-specific options. 261 ret = coder->block_encoder.update( 262 coder->block_encoder.coder, allocator, 263 filters, reversed_filters); 264 if (ret != LZMA_OK) 265 goto error; 266 } else { 267 // Trying to update the filter chain when we are already 268 // encoding Index or Stream Footer. 269 ret = LZMA_PROG_ERROR; 270 goto error; 271 } 272 273 // Free the options of the old chain. 274 for (size_t i = 0; coder->filters[i].id != LZMA_VLI_UNKNOWN; ++i) 275 lzma_free(coder->filters[i].options, allocator); 276 277 // Copy the new filter chain in place. 278 size_t j = 0; 279 do { 280 coder->filters[j].id = temp[j].id; 281 coder->filters[j].options = temp[j].options; 282 } while (temp[j++].id != LZMA_VLI_UNKNOWN); 283 284 return LZMA_OK; 285 286 error: 287 for (size_t i = 0; temp[i].id != LZMA_VLI_UNKNOWN; ++i) 288 lzma_free(temp[i].options, allocator); 289 290 return ret; 291 } 292 293 294 static lzma_ret 295 stream_encoder_init(lzma_next_coder *next, const lzma_allocator *allocator, 296 const lzma_filter *filters, lzma_check check) 297 { 298 lzma_next_coder_init(&stream_encoder_init, next, allocator); 299 300 if (filters == NULL) 301 return LZMA_PROG_ERROR; 302 303 lzma_stream_coder *coder = next->coder; 304 305 if (coder == NULL) { 306 coder = lzma_alloc(sizeof(lzma_stream_coder), allocator); 307 if (coder == NULL) 308 return LZMA_MEM_ERROR; 309 310 next->coder = coder; 311 next->code = &stream_encode; 312 next->end = &stream_encoder_end; 313 next->update = &stream_encoder_update; 314 315 coder->filters[0].id = LZMA_VLI_UNKNOWN; 316 coder->block_encoder = LZMA_NEXT_CODER_INIT; 317 coder->index_encoder = LZMA_NEXT_CODER_INIT; 318 coder->index = NULL; 319 } 320 321 // Basic initializations 322 coder->sequence = SEQ_STREAM_HEADER; 323 coder->block_options.version = 0; 324 coder->block_options.check = check; 325 326 // Initialize the Index 327 lzma_index_end(coder->index, allocator); 328 coder->index = lzma_index_init(allocator); 329 if (coder->index == NULL) 330 return LZMA_MEM_ERROR; 331 332 // Encode the Stream Header 333 lzma_stream_flags stream_flags = { 334 .version = 0, 335 .check = check, 336 }; 337 return_if_error(lzma_stream_header_encode( 338 &stream_flags, coder->buffer)); 339 340 coder->buffer_pos = 0; 341 coder->buffer_size = LZMA_STREAM_HEADER_SIZE; 342 343 // Initialize the Block encoder. This way we detect unsupported 344 // filter chains when initializing the Stream encoder instead of 345 // giving an error after Stream Header has already been written out. 346 return stream_encoder_update(coder, allocator, filters, NULL); 347 } 348 349 350 extern LZMA_API(lzma_ret) 351 lzma_stream_encoder(lzma_stream *strm, 352 const lzma_filter *filters, lzma_check check) 353 { 354 lzma_next_strm_init(stream_encoder_init, strm, filters, check); 355 356 strm->internal->supported_actions[LZMA_RUN] = true; 357 strm->internal->supported_actions[LZMA_SYNC_FLUSH] = true; 358 strm->internal->supported_actions[LZMA_FULL_FLUSH] = true; 359 strm->internal->supported_actions[LZMA_FULL_BARRIER] = true; 360 strm->internal->supported_actions[LZMA_FINISH] = true; 361 362 return LZMA_OK; 363 } 364