DatanodeProtocol.proto 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465
  1. /**
  2. * Licensed to the Apache Software Foundation (ASF) under one
  3. * or more contributor license agreements. See the NOTICE file
  4. * distributed with this work for additional information
  5. * regarding copyright ownership. The ASF licenses this file
  6. * to you under the Apache License, Version 2.0 (the
  7. * "License"); you may not use this file except in compliance
  8. * with the License. You may obtain a copy of the License at
  9. *
  10. * http://www.apache.org/licenses/LICENSE-2.0
  11. *
  12. * Unless required by applicable law or agreed to in writing, software
  13. * distributed under the License is distributed on an "AS IS" BASIS,
  14. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. * See the License for the specific language governing permissions and
  16. * limitations under the License.
  17. */
  18. /**
  19. * These .proto interfaces are private and stable.
  20. * Please see http://wiki.apache.org/hadoop/Compatibility
  21. * for what changes are allowed for a *stable* .proto interface.
  22. */
  // This file defines the protocol buffers for the protocol used from the
  // datanode to the namenode (see DatanodeProtocolService in this file).

  // The definitions in this file use proto2-only constructs (`required`
  // fields, explicit `default` values), so the syntax is declared explicitly.
  syntax = "proto2";

  // Java code generation settings.
  option java_package = "org.apache.hadoop.hdfs.protocol.proto";
  option java_outer_classname = "DatanodeProtocolProtos";
  option java_generic_services = true;
  option java_generate_equals_and_hash = true;

  package hadoop.hdfs.datanode;
  30. import "hdfs.proto";
  31. import "HdfsServer.proto";
  /**
   * Identifies a datanode to a namenode.
   */
  message DatanodeRegistrationProto {
    // Datanode information.
    required DatanodeIDProto datanodeID = 1;

    // Node information.
    required StorageInfoProto storageInfo = 2;

    // Block keys.
    required ExportedBlockKeysProto keys = 3;

    // Software version of the DN, e.g. "2.0.0".
    required string softwareVersion = 4;
  }
  /**
   * A command sent from the namenode to a datanode.
   *
   * cmdType says which kind of command this is; the optional sub-message
   * matching that cmdType carries the command itself.
   */
  message DatanodeCommandProto {
    // Kinds of command. UnusedUpgradeCommand and NullDatanodeCommand have no
    // corresponding payload field in this message.
    enum Type {
      BalancerBandwidthCommand = 0;
      BlockCommand = 1;
      BlockRecoveryCommand = 2;
      FinalizeCommand = 3;
      KeyUpdateCommand = 4;
      RegisterCommand = 5;
      UnusedUpgradeCommand = 6;
      NullDatanodeCommand = 7;
      BlockIdCommand = 8;
    }

    // Type of the command.
    required Type cmdType = 1;

    // Exactly which of the fields below is populated depends on cmdType:
    // the one corresponding to the selected type is available.
    optional BalancerBandwidthCommandProto balancerCmd = 2;
    optional BlockCommandProto blkCmd = 3;
    optional BlockRecoveryCommandProto recoveryCmd = 4;
    optional FinalizeCommandProto finalizeCmd = 5;
    optional KeyUpdateCommandProto keyUpdateCmd = 6;
    optional RegisterCommandProto registerCmd = 7;
    optional BlockIdCommandProto blkIdCmd = 8;
  }
  /**
   * Namenode-to-datanode command that sets the maximum bandwidth
   * the datanode may use for balancing.
   */
  message BalancerBandwidthCommandProto {
    // Maximum bandwidth to be used by the datanode for balancing.
    // NOTE(review): the unit is not stated in this file -- confirm.
    required uint64 bandwidth = 1;
  }
  /**
   * Instructs a datanode to perform an action on the given set of blocks.
   */
  message BlockCommandProto {
    // Action to perform. Numbering starts at 1; there is no zero value.
    enum Action {
      // Transfer blocks to another datanode.
      TRANSFER = 1;
      // Invalidate blocks.
      INVALIDATE = 2;
      // Shutdown the datanode.
      SHUTDOWN = 3;
    }

    required Action action = 1;
    required string blockPoolId = 2;

    // Blocks the action applies to.
    repeated BlockProto blocks = 3;

    // NOTE(review): the three target lists below are presumably aligned
    // with `blocks` by index -- confirm against the sender.
    repeated DatanodeInfosProto targets = 4;
    repeated StorageUuidsProto targetStorageUuids = 5;
    repeated StorageTypesProto targetStorageTypes = 6;
  }
  /**
   * Instructs a datanode to perform an action on the given set of
   * block IDs.
   */
  message BlockIdCommandProto {
    // Action to perform. Numbering starts at 1; there is no zero value.
    enum Action {
      CACHE = 1;
      UNCACHE = 2;
    }

    required Action action = 1;
    required string blockPoolId = 2;

    // IDs of the blocks the action applies to (packed encoding).
    repeated uint64 blockIds = 3 [packed = true];
  }
  /**
   * The blocks a datanode is asked to recover.
   */
  message BlockRecoveryCommandProto {
    // Blocks to be recovered by the datanode.
    repeated RecoveringBlockProto blocks = 1;
  }
  /**
   * Tells the datanode to finalize the upgrade.
   */
  message FinalizeCommandProto {
    // Block pool to be finalized.
    required string blockPoolId = 1;
  }
  /**
   * Tells the datanode to update its block keys.
   */
  message KeyUpdateCommandProto {
    // The block keys to install at the datanode.
    required ExportedBlockKeysProto keys = 1;
  }
  /**
   * Tells the datanode to register with the namenode.
   * Carries no fields.
   */
  message RegisterCommandProto {
    // Intentionally empty (void).
  }
  /**
   * Request sent by a datanode to register with the namenode.
   */
  message RegisterDatanodeRequestProto {
    // Information of the datanode registering with the namenode.
    required DatanodeRegistrationProto registration = 1;
  }
  /**
   * Response to a datanode registration.
   */
  message RegisterDatanodeResponseProto {
    // Updated registration of the datanode that successfully registered.
    // StorageInfo will be updated to include a new storage ID if the
    // datanode did not have one in the request.
    required DatanodeRegistrationProto registration = 1;
  }
  /**
   * Summary of volume failures.
   *
   * failedStorageLocations - storage locations that have failed
   * lastVolumeFailureDate - date/time of last volume failure
   * estimatedCapacityLostTotal - estimate of total capacity lost due to
   *                              volume failures
   */
  message VolumeFailureSummaryProto {
    // Storage locations that have failed.
    repeated string failedStorageLocations = 1;

    // Date/time of the last volume failure.
    // NOTE(review): epoch and unit are not stated in this file -- confirm.
    required uint64 lastVolumeFailureDate = 2;

    // Estimate of total capacity lost due to volume failures.
    required uint64 estimatedCapacityLostTotal = 3;
  }
  /**
   * Heartbeat sent from a datanode to the namenode.
   *
   * registration - datanode registration information
   * reports - storage reports.
   *     NOTE(review): the quantities below are documented for the heartbeat
   *     but are not fields of this message; presumably they are carried per
   *     storage inside each StorageReportProto -- confirm:
   *       capacity - total storage capacity available at the datanode
   *       dfsUsed - storage used by HDFS
   *       remaining - remaining storage available for HDFS
   *       blockPoolUsed - storage used by the block pool
   * xmitsInProgress - number of transfers from this datanode to others
   * xceiverCount - number of active transceiver threads
   * failedVolumes - number of failed volumes. This is redundant with the
   *     information included in volumeFailureSummary, but the field is
   *     retained for backwards compatibility.
   * cacheCapacity - total cache capacity available at the datanode
   * cacheUsed - amount of cache used
   * volumeFailureSummary - info about volume failures
   * requestFullBlockReportLease - defaults to false.
   *     NOTE(review): presumably asks the namenode for a full block report
   *     lease (see fullBlockReportLeaseId in HeartbeatResponseProto) --
   *     confirm.
   * slowPeers - info about peer DataNodes that are suspected to be slow.
   * slowDisks - info about DataNode disks that are suspected to be slow.
   */
  message HeartbeatRequestProto {
    // Datanode info.
    required DatanodeRegistrationProto registration = 1;
    repeated StorageReportProto reports = 2;
    optional uint32 xmitsInProgress = 3 [default = 0];
    optional uint32 xceiverCount = 4 [default = 0];
    // Redundant with volumeFailureSummary; kept for backwards compatibility.
    optional uint32 failedVolumes = 5 [default = 0];
    optional uint64 cacheCapacity = 6 [default = 0];
    optional uint64 cacheUsed = 7 [default = 0];
    optional VolumeFailureSummaryProto volumeFailureSummary = 8;
    optional bool requestFullBlockReportLease = 9 [default = false];
    repeated SlowPeerReportProto slowPeers = 10;
    repeated SlowDiskReportProto slowDisks = 11;
  }
  /**
   * Namenode's response to a heartbeat.
   *
   * cmds - Commands from namenode to datanode.
   * haStatus - Status (from an HA perspective) of the NN sending this
   *     response
   * rollingUpgradeStatus - optional rolling upgrade status.
   * rollingUpgradeStatusV2 - optional; same message type as
   *     rollingUpgradeStatus.
   *     NOTE(review): how V2 differs from rollingUpgradeStatus is not
   *     visible in this file -- confirm.
   * fullBlockReportLeaseId - defaults to 0.
   *     NOTE(review): presumably 0 means no lease was granted (compare
   *     BlockReportContextProto.leaseId) -- confirm.
   */
  message HeartbeatResponseProto {
    // Returned commands can be null.
    repeated DatanodeCommandProto cmds = 1;
    required NNHAStatusHeartbeatProto haStatus = 2;
    optional RollingUpgradeStatusProto rollingUpgradeStatus = 3;
    optional RollingUpgradeStatusProto rollingUpgradeStatusV2 = 4;
    optional uint64 fullBlockReportLeaseId = 5 [default = 0];
  }
  /**
   * Block report sent from a datanode to the namenode.
   *
   * registration - datanode registration information
   * blockPoolId - block pool ID of the reported blocks
   * reports - per-storage block reports (StorageBlockReportProto).
   *     This message has no `blocks` field of its own; the block encoding
   *     below presumably describes the `blocks` field of each entry in
   *     `reports` (NOTE(review): confirm). Each block is represented as
   *     multiple longs in the array:
   *       first long represents block ID
   *       second long represents length
   *       third long represents gen stamp
   *       fourth long (if under construction) represents replica state
   * context - An optional field containing information about the context
   *     of this block report.
   */
  message BlockReportRequestProto {
    required DatanodeRegistrationProto registration = 1;
    required string blockPoolId = 2;
    repeated StorageBlockReportProto reports = 3;
    optional BlockReportContextProto context = 4;
  }
  /**
   * Context of one RPC belonging to a (possibly multi-RPC) block report.
   */
  message BlockReportContextProto {
    // Total number of RPCs this block report is broken into.
    required int32 totalRpcs = 1;

    // Zero-based index of the current RPC.
    required int32 curRpc = 2;

    // Unique 64-bit ID of this block report.
    required int64 id = 3;

    // Block report lease ID, or 0 if we are sending without a lease to
    // bypass rate-limiting.
    optional uint64 leaseId = 4 [default = 0];
  }
  /**
   * Report of the blocks held in one storage.
   */
  message StorageBlockReportProto {
    // The storage being reported on.
    required DatanodeStorageProto storage = 1;

    // Reported blocks, encoded as packed unsigned 64-bit integers.
    repeated uint64 blocks = 2 [packed = true];

    // NOTE(review): numberOfBlocks and blocksBuffers are undocumented in
    // this file; presumably an alternative buffer-based encoding of the
    // same report -- confirm.
    optional uint64 numberOfBlocks = 3;
    repeated bytes blocksBuffers = 4;
  }
  /**
   * Namenode's response to a block report.
   */
  message BlockReportResponseProto {
    // Command from the namenode to the datanode, if any.
    optional DatanodeCommandProto cmd = 1;
  }
  /**
   * Cache report sent from a datanode to the namenode.
   */
  message CacheReportRequestProto {
    // Datanode registration information.
    required DatanodeRegistrationProto registration = 1;

    // Block pool ID of the reported blocks.
    required string blockPoolId = 2;

    // Blocks, represented as longs for efficiency reasons (packed).
    repeated uint64 blocks = 3 [packed = true];
  }
  /**
   * Response to a cache report.
   */
  message CacheReportResponseProto {
    // Optional command for the datanode.
    optional DatanodeCommandProto cmd = 1;
  }
  /**
   * Carries received or deleted block information from a datanode
   * to the namenode.
   */
  message ReceivedDeletedBlockInfoProto {
    // State being reported for the block.
    enum BlockStatus {
      // Block being created.
      RECEIVING = 1;
      // Block creation complete.
      RECEIVED = 2;
      DELETED = 3;
    }

    required BlockProto block = 1;

    // Note: `status` uses field number 3 and `deleteHint` uses 2. The
    // numbers identify the fields on the wire and must not be swapped to
    // match declaration order.
    required BlockStatus status = 3;
    optional string deleteHint = 2;
  }
  /**
   * Blocks received and deleted for one storage.
   */
  message StorageReceivedDeletedBlocksProto {
    // Deprecated: superseded by `storage`. Still declared `required`, so
    // senders must continue to set it.
    required string storageUuid = 1 [deprecated = true];

    // The received/deleted blocks.
    repeated ReceivedDeletedBlockInfoProto blocks = 2;

    // Supersedes storageUuid.
    optional DatanodeStorageProto storage = 3;
  }
  /**
   * Request reporting received and deleted blocks to the namenode.
   */
  message BlockReceivedAndDeletedRequestProto {
    // Datanode registration information.
    required DatanodeRegistrationProto registration = 1;

    // Block pool ID of the reported blocks.
    required string blockPoolId = 2;

    // Received/deleted block list.
    repeated StorageReceivedDeletedBlocksProto blocks = 3;
  }
  /**
   * Empty (void) response to BlockReceivedAndDeletedRequestProto.
   */
  message BlockReceivedAndDeletedResponseProto {
  }
  /**
   * Error report sent by a datanode.
   *
   * Note: the field name `registartion` is misspelled ("registration").
   * The spelling is part of the generated API, so it is kept as is.
   */
  message ErrorReportRequestProto {
    enum ErrorCode {
      // Error report to be logged at the namenode.
      NOTIFY = 0;
      // DN has disk errors but still has valid volumes.
      DISK_ERROR = 1;
      // Command from namenode has invalid block ID.
      INVALID_BLOCK = 2;
      // No valid volumes left on datanode.
      FATAL_DISK_ERROR = 3;
    }

    // Registration info of the datanode reporting the error.
    required DatanodeRegistrationProto registartion = 1;

    // Error code indicating the error. Declared as uint32, not as the
    // ErrorCode enum above.
    // NOTE(review): presumably holds one of the ErrorCode values -- confirm.
    required uint32 errorCode = 2;

    // Free text description of the error.
    required string msg = 3;
  }
  /**
   * Empty (void) response to ErrorReportRequestProto.
   */
  message ErrorReportResponseProto {
  }
  /**
   * Request reporting corrupt blocks.
   */
  message ReportBadBlocksRequestProto {
    // Blocks that are reported as corrupt.
    repeated LocatedBlockProto blocks = 1;
  }
  /**
   * Empty (void) response to ReportBadBlocksRequestProto.
   */
  message ReportBadBlocksResponseProto {
  }
  /**
   * Request to commit block synchronization during lease recovery.
   *
   * Note: the field name `newTaragets` is misspelled ("newTargets").
   * The spelling is part of the generated API, so it is kept as is.
   */
  message CommitBlockSynchronizationRequestProto {
    // The block being synchronized.
    required ExtendedBlockProto block = 1;

    required uint64 newGenStamp = 2;
    required uint64 newLength = 3;
    required bool closeFile = 4;
    required bool deleteBlock = 5;

    // NOTE(review): newTargetStorages is presumably aligned with
    // newTaragets by index -- confirm against the sender.
    repeated DatanodeIDProto newTaragets = 6;
    repeated string newTargetStorages = 7;
  }
  /**
   * Empty (void) response to CommitBlockSynchronizationRequestProto.
   */
  message CommitBlockSynchronizationResponseProto {
  }
  /**
   * One slow peer, as may be reported by the DataNode to the NameNode in
   * the heartbeat request.
   *
   * Holds the peer's DataNodeId together with its aggregate packet latency
   * as observed by the reporting DataNode. (DataNodeId must be transmitted
   * as a string for protocol compatibility with earlier versions of
   * Hadoop.)
   *
   * The exact choice of the aggregate is opaque to the NameNode, but it
   * _should_ be chosen consistently by all DataNodes in the cluster.
   * Examples of aggregates are 90th percentile (good) and mean (not so
   * good).
   */
  message SlowPeerReportProto {
    // DataNodeId of the slow peer, as a string.
    optional string dataNodeId = 1;

    // Aggregate packet latency observed by the reporting DataNode.
    optional double aggregateLatency = 2;
  }
  /**
   * One slow disk, as may be reported by the DataNode to the NameNode in
   * the heartbeat request. All latencies are as observed by the DataNode.
   */
  message SlowDiskReportProto {
    // The disk's basePath.
    optional string basePath = 1;

    // Mean metadata op latency.
    optional double meanMetadataOpLatency = 2;

    // Mean read io latency.
    optional double meanReadIoLatency = 3;

    // Mean write io latency.
    optional double meanWriteIoLatency = 4;
  }
  /**
   * Protocol used from the datanode to the namenode.
   * Details of each rpc call are documented on its request and response
   * messages.
   */
  service DatanodeProtocolService {
    // Register a datanode at a namenode.
    rpc registerDatanode(RegisterDatanodeRequestProto)
        returns (RegisterDatanodeResponseProto);

    // Send heartbeat from datanode to namenode.
    rpc sendHeartbeat(HeartbeatRequestProto)
        returns (HeartbeatResponseProto);

    // Report blocks at a given datanode to the namenode.
    rpc blockReport(BlockReportRequestProto)
        returns (BlockReportResponseProto);

    // Report cached blocks at a datanode to the namenode.
    rpc cacheReport(CacheReportRequestProto)
        returns (CacheReportResponseProto);

    // Incremental block report from the DN. This contains info about
    // recently received and deleted blocks, as well as when blocks start
    // being received.
    rpc blockReceivedAndDeleted(BlockReceivedAndDeletedRequestProto)
        returns (BlockReceivedAndDeletedResponseProto);

    // Report from a datanode of an error to the active namenode.
    // Used for debugging.
    rpc errorReport(ErrorReportRequestProto)
        returns (ErrorReportResponseProto);

    // Request the version. The request/response messages are not defined
    // in this file (presumably they come from an imported .proto).
    rpc versionRequest(VersionRequestProto)
        returns (VersionResponseProto);

    // Report corrupt blocks at the specified location.
    rpc reportBadBlocks(ReportBadBlocksRequestProto)
        returns (ReportBadBlocksResponseProto);

    // Commit block synchronization during lease recovery.
    rpc commitBlockSynchronization(CommitBlockSynchronizationRequestProto)
        returns (CommitBlockSynchronizationResponseProto);
  }