Mercurial > hgrepos > Python2 > PyMuPDF
diff mupdf-source/thirdparty/gumbo-parser/src/string_buffer.c @ 2:b50eed0cc0ef upstream
ADD: MuPDF v1.26.7: the MuPDF source as downloaded by a default build of PyMuPDF 1.26.4.
The directory name has changed: no version number in the expanded directory now.
| author | Franz Glasner <fzglas.hg@dom66.de> |
|---|---|
| date | Mon, 15 Sep 2025 11:43:07 +0200 |
| parents | |
| children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mupdf-source/thirdparty/gumbo-parser/src/string_buffer.c Mon Sep 15 11:43:07 2025 +0200 @@ -0,0 +1,110 @@ +// Copyright 2010 Google Inc. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. +// +// Author: jdtang@google.com (Jonathan Tang) + +#include "string_buffer.h" + +#include <assert.h> +#include <stdlib.h> +#include <string.h> +#include <strings.h> + +#include "string_piece.h" +#include "util.h" + +struct GumboInternalParser; + +// Size chosen via statistical analysis of ~60K websites. +// 99% of text nodes and 98% of attribute names/values fit in this initial size. +static const size_t kDefaultStringBufferSize = 5; + +static void maybe_resize_string_buffer(struct GumboInternalParser* parser, + size_t additional_chars, GumboStringBuffer* buffer) { + size_t new_length = buffer->length + additional_chars; + size_t new_capacity = buffer->capacity; + while (new_capacity < new_length) { + new_capacity *= 2; + } + if (new_capacity != buffer->capacity) { + char* new_data = gumbo_parser_allocate(parser, new_capacity); + memcpy(new_data, buffer->data, buffer->length); + gumbo_parser_deallocate(parser, buffer->data); + buffer->data = new_data; + buffer->capacity = new_capacity; + } +} + +void gumbo_string_buffer_init( + struct GumboInternalParser* parser, GumboStringBuffer* output) { + output->data = gumbo_parser_allocate(parser, kDefaultStringBufferSize); + output->length = 0; + output->capacity = kDefaultStringBufferSize; +} + +void gumbo_string_buffer_reserve(struct GumboInternalParser* parser, + size_t min_capacity, GumboStringBuffer* output) { + maybe_resize_string_buffer(parser, min_capacity - output->length, output); +} + +void gumbo_string_buffer_append_codepoint( + struct GumboInternalParser* parser, int c, GumboStringBuffer* output) { + // num_bytes is actually the number of continuation bytes, 1 less than the + // total number of bytes. This is done to keep the loop below simple and + // should probably change if we unroll it. + int num_bytes, prefix; + if (c <= 0x7f) { + num_bytes = 0; + prefix = 0; + } else if (c <= 0x7ff) { + num_bytes = 1; + prefix = 0xc0; + } else if (c <= 0xffff) { + num_bytes = 2; + prefix = 0xe0; + } else { + num_bytes = 3; + prefix = 0xf0; + } + maybe_resize_string_buffer(parser, num_bytes + 1, output); + output->data[output->length++] = prefix | (c >> (num_bytes * 6)); + for (int i = num_bytes - 1; i >= 0; --i) { + output->data[output->length++] = 0x80 | (0x3f & (c >> (i * 6))); + } +} + +void gumbo_string_buffer_append_string(struct GumboInternalParser* parser, + GumboStringPiece* str, GumboStringBuffer* output) { + maybe_resize_string_buffer(parser, str->length, output); + memcpy(output->data + output->length, str->data, str->length); + output->length += str->length; +} + +char* gumbo_string_buffer_to_string( + struct GumboInternalParser* parser, GumboStringBuffer* input) { + char* buffer = gumbo_parser_allocate(parser, input->length + 1); + memcpy(buffer, input->data, input->length); + buffer[input->length] = '\0'; + return buffer; +} + +void gumbo_string_buffer_clear( + struct GumboInternalParser* parser, GumboStringBuffer* input) { + input->length = 0; +} + +void gumbo_string_buffer_destroy( + struct GumboInternalParser* parser, GumboStringBuffer* buffer) { + gumbo_parser_deallocate(parser, buffer->data); +}
