/* * Copyright (c) Meta Platforms, Inc. and affiliates. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #pragma once #include #include #include #include #include #include #include #include #include namespace apache { namespace thrift { namespace op { namespace detail { // Helpers for combining string or binary buffers. template uint32_t combineBuf(Accumulator& acc, const Buffer& buffer, size_t size) { uint32_t limit = std::numeric_limits::max(); if (size > limit) { protocol::TProtocolException::throwExceededSizeLimit(size, limit); } acc.beginOrdered(); acc.combine(static_cast(size)); acc.combine(buffer); acc.endOrdered(); return 0; } template uint32_t combineBuf(Accumulator& acc, const Buffer& buf) { return combineBuf( acc, folly::ByteRange( reinterpret_cast(buf.data()), buf.size()), buf.size()); } template uint32_t combineBuf(Accumulator& acc, const folly::IOBuf& buf) { return combineBuf(acc, buf, buf.computeChainDataLength()); } template uint32_t combineBuf( Accumulator& acc, const std::unique_ptr& buf) { return buf == nullptr ? combineBuf(acc, folly::ByteRange{}) : combineBuf(acc, *buf); } template void beginContainer(Accumulator& acc, uint32_t size) { acc.beginOrdered(); acc.combine(static_cast(size)); } template uint32_t endContainer(Accumulator& acc) { return (acc.endOrdered(), 0); } template FOLLY_NODISCARD auto makeContainerHashGuard(Accumulator& acc, uint32_t size) { beginContainer(acc, size); return folly::makeGuard([&] { endContainer(acc); }); } /** * A deterministic one-way/write-only custom protocol that guarantees the * accumulated results to be stable and consistent across different languages * and implementations. Protocol wraps an accumulator and allows users to * provide custom implementations for it. * * Names: * To enable better development experience we do not include struct names, * field names and paths into the hash computation, but we do include field * id. This way refactoring to rename or move a struct around will not change * the computed hash values. One thing to note here if the hashes are used for * signatures or keyed mac computations you might want to use a different key * per struct to avoid collisions in case struct layouts match. * * Ordering: * Fields, Maps and Sets are treated as unordered collections. * Lists, Prefixes and Map Values are treated as ordered collections. * Re-arranging fields in a struct will not change the hash if you preserve * field ids. The specifics of order handling is delegated to Accumulator * implementation. * * Prefixing: * To have a better collision protection all fields are prefixed with a type * tag that goes into the hash computation. All dynamic sized (non-scalar) * types also get a size prefix. */ // TODO(afuller): Do not use a protocol for this, which requires the custom // protocol header to be included by the caller and for adapted types to be // converted to thrift before being hashed, even if they can be hashed // directly (via the a hook on the given Adapter). Instead add ThriftType // info and accessors to the struct definition, and use that. template class HashProtocol { public: explicit HashProtocol(Accumulator& accumulator) : acc_(accumulator) {} static constexpr bool kSortKeys() { return false; } uint32_t writeStructBegin(const char*) { return (acc_.beginUnordered(), 0); } uint32_t writeStructEnd() { return (acc_.endUnordered(), 0); } uint32_t writeFieldBegin(const char*, protocol::TType, int16_t id) { return (acc_.beginOrdered(), writeI16(id), 0); } uint32_t writeFieldEnd() { return (acc_.endOrdered(), 0); } uint32_t writeFieldStop() { return 0; } uint32_t writeMapBegin(protocol::TType, protocol::TType, uint32_t size) { return (beginContainer(acc_, size), acc_.beginUnordered(), 0); } uint32_t writeMapValueBegin() { return (acc_.beginOrdered(), 0); } uint32_t writeMapValueEnd() { return (acc_.endOrdered(), 0); } uint32_t writeMapEnd() { return (acc_.endUnordered(), endContainer(acc_)); } uint32_t writeListBegin(protocol::TType, uint32_t size) { return (beginContainer(acc_, size), acc_.beginOrdered(), 0); } uint32_t writeListEnd() { return (acc_.endOrdered(), endContainer(acc_)); } uint32_t writeSetBegin(protocol::TType, uint32_t size) { return (beginContainer(acc_, size), acc_.beginUnordered(), 0); } uint32_t writeSetEnd() { return (acc_.endUnordered(), endContainer(acc_)); } uint32_t writeBool(bool val) { return (acc_.combine(val), 0); } uint32_t writeByte(int8_t val) { return (acc_.combine(val), 0); } uint32_t writeI16(int16_t val) { return (acc_.combine(val), 0); } uint32_t writeI32(int32_t val) { return (acc_.combine(val), 0); } uint32_t writeI64(int64_t val) { return (acc_.combine(val), 0); } uint32_t writeDouble(double val) { return (acc_.combine(val), 0); } uint32_t writeFloat(float val) { return (acc_.combine(val), 0); } uint32_t writeString(folly::StringPiece val) { return combineBuf(acc_, val); } uint32_t writeBinary(folly::StringPiece val) { return combineBuf(acc_, val); } uint32_t writeBinary(folly::ByteRange val) { return combineBuf(acc_, val); } uint32_t writeBinary(const std::unique_ptr& val) { return combineBuf(acc_, val); } uint32_t writeBinary(const folly::IOBuf& val) { return combineBuf(acc_, val); } private: Accumulator& acc_; }; } // namespace detail } // namespace op } // namespace thrift } // namespace apache