// Copyright 2010 Google Inc. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. // // Author: jdtang@google.com (Jonathan Tang) #include "string_buffer.h" #include #include #include #include #include "string_piece.h" #include "util.h" struct _GumboParser; static const size_t kDefaultStringBufferSize = 10; static void maybe_resize_string_buffer( struct _GumboParser* parser, size_t additional_chars, GumboStringBuffer* buffer) { size_t new_length = buffer->length + additional_chars; size_t new_capacity = buffer->capacity; while (new_capacity < new_length) { new_capacity *= 2; } if (new_capacity != buffer->capacity) { char* new_data = gumbo_parser_allocate(parser, new_capacity); memcpy(new_data, buffer->data, buffer->length); gumbo_parser_deallocate(parser, buffer->data); buffer->data = new_data; buffer->capacity = new_capacity; } } void gumbo_string_buffer_init( struct _GumboParser* parser, GumboStringBuffer* output) { output->data = gumbo_parser_allocate(parser, kDefaultStringBufferSize); output->length = 0; output->capacity = kDefaultStringBufferSize; } void gumbo_string_buffer_reserve( struct _GumboParser* parser, size_t min_capacity, GumboStringBuffer* output) { maybe_resize_string_buffer(parser, min_capacity - output->length, output); } void gumbo_string_buffer_append_codepoint( struct _GumboParser* parser, int c, GumboStringBuffer* output) { // num_bytes is actually the number of continuation bytes, 1 less than the // total number of bytes. This is done to keep the loop below simple and // should probably change if we unroll it. int num_bytes, prefix; if (c <= 0x7f) { num_bytes = 0; prefix = 0; } else if (c <= 0x7ff) { num_bytes = 1; prefix = 0xc0; } else if (c <= 0xffff) { num_bytes = 2; prefix = 0xe0; } else { num_bytes = 3; prefix = 0xf0; } maybe_resize_string_buffer(parser, num_bytes + 1, output); output->data[output->length++] = prefix | (c >> (num_bytes * 6)); for (int i = num_bytes - 1; i >= 0; --i) { output->data[output->length++] = 0x80 | (0x3f & (c >> (i * 6))); } } void gumbo_string_buffer_append_string( struct _GumboParser* parser, GumboStringPiece* str, GumboStringBuffer* output) { maybe_resize_string_buffer(parser, str->length, output); memcpy(output->data + output->length, str->data, str->length); output->length += str->length; } char* gumbo_string_buffer_to_string( struct _GumboParser* parser, GumboStringBuffer* input) { char* buffer = gumbo_parser_allocate(parser, input->length + 1); memcpy(buffer, input->data, input->length); buffer[input->length] = '\0'; return buffer; } void gumbo_string_buffer_destroy( struct _GumboParser* parser, GumboStringBuffer* buffer) { gumbo_parser_deallocate(parser, buffer->data); }