| /* |
| * Copyright (C) 2018 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "perfetto/protozero/proto_decoder.h" |
| |
| #include <string.h> |
| |
| #include <cinttypes> |
| #include <limits> |
| #include <memory> |
| |
| #include "perfetto/base/compiler.h" |
| #include "perfetto/base/logging.h" |
| #include "perfetto/ext/base/utils.h" |
| #include "perfetto/protozero/proto_utils.h" |
| |
| namespace protozero { |
| |
| using namespace proto_utils; |
| |
| #if !PERFETTO_IS_LITTLE_ENDIAN() |
| #error Unimplemented for big endian archs. |
| #endif |
| |
| namespace { |
| |
| struct ParseFieldResult { |
| enum ParseResult { kAbort, kSkip, kOk }; |
| ParseResult parse_res; |
| const uint8_t* next; |
| Field field; |
| }; |
| |
| // Parses one field and returns the field itself and a pointer to the next |
| // field to parse. If parsing fails, the returned |next| == |buffer|. |
| ParseFieldResult ParseOneField(const uint8_t* const buffer, |
| const uint8_t* const end) { |
| ParseFieldResult res{ParseFieldResult::kAbort, buffer, Field{}}; |
| |
| // The first byte of a proto field is structured as follows: |
| // The least 3 significant bits determine the field type. |
| // The most 5 significant bits determine the field id. If MSB == 1, the |
| // field id continues on the next bytes following the VarInt encoding. |
| const uint8_t kFieldTypeNumBits = 3; |
| const uint64_t kFieldTypeMask = (1 << kFieldTypeNumBits) - 1; // 0000 0111; |
| const uint8_t* pos = buffer; |
| |
| // If we've already hit the end, just return an invalid field. |
| if (PERFETTO_UNLIKELY(pos >= end)) |
| return res; |
| |
| uint64_t preamble = 0; |
| if (PERFETTO_LIKELY(*pos < 0x80)) { // Fastpath for fields with ID < 16. |
| preamble = *(pos++); |
| } else { |
| const uint8_t* next = ParseVarInt(pos, end, &preamble); |
| if (PERFETTO_UNLIKELY(pos == next)) |
| return res; |
| pos = next; |
| } |
| |
| uint32_t field_id = static_cast<uint32_t>(preamble >> kFieldTypeNumBits); |
| if (field_id == 0 || pos >= end) |
| return res; |
| |
| auto field_type = static_cast<uint8_t>(preamble & kFieldTypeMask); |
| const uint8_t* new_pos = pos; |
| uint64_t int_value = 0; |
| uint64_t size = 0; |
| |
| switch (field_type) { |
| case static_cast<uint8_t>(ProtoWireType::kVarInt): { |
| new_pos = ParseVarInt(pos, end, &int_value); |
| |
| // new_pos not being greater than pos means ParseVarInt could not fully |
| // parse the number. This is because we are out of space in the buffer. |
| // Set the id to zero and return but don't update the offset so a future |
| // read can read this field. |
| if (PERFETTO_UNLIKELY(new_pos == pos)) |
| return res; |
| |
| break; |
| } |
| |
| case static_cast<uint8_t>(ProtoWireType::kLengthDelimited): { |
| uint64_t payload_length; |
| new_pos = ParseVarInt(pos, end, &payload_length); |
| if (PERFETTO_UNLIKELY(new_pos == pos)) |
| return res; |
| |
| // ParseVarInt guarantees that |new_pos| <= |end| when it succeeds; |
| if (payload_length > static_cast<uint64_t>(end - new_pos)) |
| return res; |
| |
| const uintptr_t payload_start = reinterpret_cast<uintptr_t>(new_pos); |
| int_value = payload_start; |
| size = payload_length; |
| new_pos += payload_length; |
| break; |
| } |
| |
| case static_cast<uint8_t>(ProtoWireType::kFixed64): { |
| new_pos = pos + sizeof(uint64_t); |
| if (PERFETTO_UNLIKELY(new_pos > end)) |
| return res; |
| memcpy(&int_value, pos, sizeof(uint64_t)); |
| break; |
| } |
| |
| case static_cast<uint8_t>(ProtoWireType::kFixed32): { |
| new_pos = pos + sizeof(uint32_t); |
| if (PERFETTO_UNLIKELY(new_pos > end)) |
| return res; |
| memcpy(&int_value, pos, sizeof(uint32_t)); |
| break; |
| } |
| |
| default: |
| PERFETTO_DLOG("Invalid proto field type: %u", field_type); |
| return res; |
| } |
| |
| res.next = new_pos; |
| |
| if (PERFETTO_UNLIKELY(field_id > Field::kMaxId)) { |
| PERFETTO_DLOG("Skipping field %" PRIu32 " because its id > %" PRIu32, |
| field_id, Field::kMaxId); |
| res.parse_res = ParseFieldResult::kSkip; |
| return res; |
| } |
| |
| if (PERFETTO_UNLIKELY(size > proto_utils::kMaxMessageLength)) { |
| PERFETTO_DLOG("Skipping field %" PRIu32 " because it's too big (%" PRIu64 |
| " KB)", |
| field_id, size / 1024); |
| res.parse_res = ParseFieldResult::kSkip; |
| return res; |
| } |
| |
| res.parse_res = ParseFieldResult::kOk; |
| res.field.initialize(field_id, field_type, int_value, |
| static_cast<uint32_t>(size)); |
| return res; |
| } |
| |
| } // namespace |
| |
| Field ProtoDecoder::FindField(uint32_t field_id) { |
| Field res{}; |
| auto old_position = read_ptr_; |
| read_ptr_ = begin_; |
| for (auto f = ReadField(); f.valid(); f = ReadField()) { |
| if (f.id() == field_id) { |
| res = f; |
| break; |
| } |
| } |
| read_ptr_ = old_position; |
| return res; |
| } |
| |
| Field ProtoDecoder::ReadField() { |
| ParseFieldResult res; |
| do { |
| res = ParseOneField(read_ptr_, end_); |
| read_ptr_ = res.next; |
| } while (PERFETTO_UNLIKELY(res.parse_res == ParseFieldResult::kSkip)); |
| return res.field; |
| } |
| |
| void TypedProtoDecoderBase::ParseAllFields() { |
| const uint8_t* cur = begin_; |
| ParseFieldResult res; |
| for (;;) { |
| res = ParseOneField(cur, end_); |
| PERFETTO_DCHECK(res.parse_res != ParseFieldResult::kOk || res.next != cur); |
| cur = res.next; |
| if (PERFETTO_UNLIKELY(res.parse_res == ParseFieldResult::kSkip)) |
| continue; |
| if (PERFETTO_UNLIKELY(res.parse_res == ParseFieldResult::kAbort)) |
| break; |
| |
| PERFETTO_DCHECK(res.parse_res == ParseFieldResult::kOk); |
| PERFETTO_DCHECK(res.field.valid()); |
| auto field_id = res.field.id(); |
| if (PERFETTO_UNLIKELY(field_id >= num_fields_)) |
| continue; |
| |
| // There are two reasons why we might want to expand the heap capacity: |
| // 1. We are writing a non-repeated field, which has an id > |
| // INITIAL_STACK_CAPACITY. In this case ExpandHeapStorage() ensures to |
| // allocate at least (num_fields_ + 1) slots. |
| // 2. We are writing a repeated field but ran out of capacity. |
| if (PERFETTO_UNLIKELY(field_id >= size_ || size_ >= capacity_)) |
| ExpandHeapStorage(); |
| |
| PERFETTO_DCHECK(field_id < size_); |
| Field* fld = &fields_[field_id]; |
| if (PERFETTO_LIKELY(!fld->valid())) { |
| // This is the first time we see this field. |
| *fld = std::move(res.field); |
| } else { |
| // Repeated field case. |
| // In this case we need to: |
| // 1. Append the last value of the field to end of the repeated field |
| // storage. |
| // 2. Replace the default instance at offset |field_id| with the current |
| // value. This is because in case of repeated field a call to Get(X) is |
| // supposed to return the last value of X, not the first one. |
| // This is so that the RepeatedFieldIterator will iterate in the right |
| // order, see comments on RepeatedFieldIterator. |
| PERFETTO_DCHECK(size_ < capacity_); |
| fields_[size_++] = *fld; |
| *fld = std::move(res.field); |
| } |
| } |
| read_ptr_ = res.next; |
| } |
| |
| void TypedProtoDecoderBase::ExpandHeapStorage() { |
| // When we expand the heap we must ensure that we have at very last capacity |
| // to deal with all known fields plus at least one repeated field. We go +2048 |
| // here based on observations on a large 4GB android trace. This is to avoid |
| // trivial re-allocations when dealing with repeated fields of a message that |
| // has > INITIAL_STACK_CAPACITY fields. |
| const uint32_t min_capacity = num_fields_ + 2048; // Any num >= +1 will do. |
| const uint32_t new_capacity = std::max(capacity_ * 2, min_capacity); |
| PERFETTO_CHECK(new_capacity > size_ && new_capacity > num_fields_); |
| std::unique_ptr<Field[]> new_storage(new Field[new_capacity]); |
| |
| static_assert(std::is_trivially_constructible<Field>::value, |
| "Field must be trivially constructible"); |
| static_assert(std::is_trivially_copyable<Field>::value, |
| "Field must be trivially copyable"); |
| |
| // Zero-initialize the slots for known field IDs slots, as they can be |
| // randomly accessed. Instead, there is no need to initialize the repeated |
| // slots, because they are written linearly with no gaps and are always |
| // initialized before incrementing |size_|. |
| const uint32_t new_size = std::max(size_, num_fields_); |
| memset(&new_storage[size_], 0, sizeof(Field) * (new_size - size_)); |
| |
| memcpy(&new_storage[0], fields_, sizeof(Field) * size_); |
| |
| heap_storage_ = std::move(new_storage); |
| fields_ = &heap_storage_[0]; |
| capacity_ = new_capacity; |
| size_ = new_size; |
| } |
| |
| } // namespace protozero |