123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158 |
- /**
- * Licensed to the Apache Software Foundation (ASF) under one
- * or more contributor license agreements. See the NOTICE file
- * distributed with this work for additional information
- * regarding copyright ownership. The ASF licenses this file
- * to you under the Apache License, Version 2.0 (the
- * "License"); you may not use this file except in compliance
- * with the License. You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- #ifndef BLOCK_READER_H_
- #define BLOCK_READER_H_
- #include "hdfspp/status.h"
- #include "common/async_stream.h"
- #include "common/cancel_tracker.h"
- #include "common/new_delete.h"
- #include "datatransfer.pb.h"
- #include "connection/datanodeconnection.h"
- #include <memory>
- namespace hdfs {
/**
 * Caching hints carried alongside a block read.
 *
 * Each setting is stored as a value plus a companion "*_specified" flag.
 * NOTE(review): presumably the flag records whether the caller explicitly
 * set the value -- confirm against the code that consumes this struct.
 */
struct CacheStrategy {
  bool drop_behind_specified;
  bool drop_behind;
  bool read_ahead_specified;
  unsigned long long read_ahead;

  /** Starts with nothing specified: every flag false, read_ahead zero. */
  CacheStrategy()
      : drop_behind_specified(false),
        drop_behind(false),
        read_ahead_specified(false),
        // read_ahead is an integer, so initialize it with an integer literal
        // rather than relying on a bool -> integer conversion.
        read_ahead(0) {}
};
/**
 * Three-way drop-behind selector: not specified, enabled, or disabled.
 * The numeric values are fixed explicitly so they do not shift if the
 * enumerators are ever reordered.
 */
enum DropBehindStrategy {
  kUnspecified       = 0,  // no preference given
  kEnableDropBehind  = 1,
  kDisableDropBehind = 2
};
/**
 * Encryption scheme selector for a block read.
 * NOTE(review): kAESCTRNoPadding presumably denotes AES in CTR mode without
 * padding -- inferred from the name only; confirm against the consumer.
 */
enum EncryptionScheme {
  kNone            = 0,  // no encryption
  kAESCTRNoPadding = 1
};
- struct BlockReaderOptions {
- bool verify_checksum;
- CacheStrategy cache_strategy;
- EncryptionScheme encryption_scheme;
- BlockReaderOptions()
- : verify_checksum(true), encryption_scheme(EncryptionScheme::kNone) {}
- };
- /**
- * Handles the operational state of request and reading a block (or portion of
- * a block) from a DataNode.
- *
- * Threading model: not thread-safe.
- * Lifecycle: should be created, used for a single read, then freed.
- */
- class BlockReader {
- public:
- MEMCHECKED_CLASS(BlockReader)
- virtual void AsyncReadBlock(
- const std::string & client_name,
- const hadoop::hdfs::LocatedBlockProto &block, size_t offset,
- const MutableBuffers &buffers,
- const std::function<void(const Status &, size_t)> handler) = 0;
- virtual void AsyncReadPacket(
- const MutableBuffers &buffers,
- const std::function<void(const Status &, size_t bytes_transferred)> &handler) = 0;
- virtual void AsyncRequestBlock(
- const std::string &client_name,
- const hadoop::hdfs::ExtendedBlockProto *block,
- uint64_t length,
- uint64_t offset,
- const std::function<void(Status)> &handler) = 0;
- virtual void CancelOperation() = 0;
- };
- class BlockReaderImpl
- : public BlockReader, public std::enable_shared_from_this<BlockReaderImpl> {
- public:
- explicit BlockReaderImpl(const BlockReaderOptions &options, std::shared_ptr<DataNodeConnection> dn,
- CancelHandle cancel_state)
- : dn_(dn), state_(kOpen), options_(options),
- chunk_padding_bytes_(0), cancel_state_(cancel_state) {}
- virtual void AsyncReadPacket(
- const MutableBuffers &buffers,
- const std::function<void(const Status &, size_t bytes_transferred)> &handler) override;
- virtual void AsyncRequestBlock(
- const std::string &client_name,
- const hadoop::hdfs::ExtendedBlockProto *block,
- uint64_t length,
- uint64_t offset,
- const std::function<void(Status)> &handler) override;
- virtual void AsyncReadBlock(
- const std::string & client_name,
- const hadoop::hdfs::LocatedBlockProto &block, size_t offset,
- const MutableBuffers &buffers,
- const std::function<void(const Status &, size_t)> handler) override;
- virtual void CancelOperation() override;
- size_t ReadPacket(const MutableBuffers &buffers, Status *status);
- Status RequestBlock(
- const std::string &client_name,
- const hadoop::hdfs::ExtendedBlockProto *block,
- uint64_t length,
- uint64_t offset);
- private:
- struct RequestBlockContinuation;
- struct ReadBlockContinuation;
- struct ReadPacketHeader;
- struct ReadChecksum;
- struct ReadPadding;
- struct ReadData;
- struct AckRead;
- enum State {
- kOpen,
- kReadPacketHeader,
- kReadChecksum,
- kReadPadding,
- kReadData,
- kFinished,
- };
- std::shared_ptr<DataNodeConnection> dn_;
- hadoop::hdfs::PacketHeaderProto header_;
- State state_;
- BlockReaderOptions options_;
- size_t packet_len_;
- int packet_data_read_bytes_;
- int chunk_padding_bytes_;
- long long bytes_to_read_;
- std::vector<char> checksum_;
- CancelHandle cancel_state_;
- };
- }
- #endif
|