hdfs.proto 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574
  1. /**
  2. * Licensed to the Apache Software Foundation (ASF) under one
  3. * or more contributor license agreements. See the NOTICE file
  4. * distributed with this work for additional information
  5. * regarding copyright ownership. The ASF licenses this file
  6. * to you under the Apache License, Version 2.0 (the
  7. * "License"); you may not use this file except in compliance
  8. * with the License. You may obtain a copy of the License at
  9. *
  10. * http://www.apache.org/licenses/LICENSE-2.0
  11. *
  12. * Unless required by applicable law or agreed to in writing, software
  13. * distributed under the License is distributed on an "AS IS" BASIS,
  14. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  15. * See the License for the specific language governing permissions and
  16. * limitations under the License.
  17. */
  18. /**
  19. * These .proto interfaces are private and stable.
  20. * Please see http://wiki.apache.org/hadoop/Compatibility
  21. * for what changes are allowed for a *stable* .proto interface.
  22. */
  23. // This file contains protocol buffers that are used throughout HDFS -- i.e.
  24. // by the client, server, and data transfer protocols.
  // proto2 is declared explicitly: the definitions in this file rely on
  // proto2-only features such as `required` fields and explicit defaults.
  // Without this statement protoc assumes proto2 but emits a warning.
  syntax = "proto2";

  // Java code generation settings.
  option java_package = "org.apache.hadoop.hdfs.protocol.proto";
  option java_outer_classname = "HdfsProtos";
  option java_generate_equals_and_hash = true;

  // Proto package that scopes every type declared in this file.
  package hadoop.hdfs;

  // Imported for hadoop.common.TokenProto, which LocatedBlockProto references.
  // NOTE(review): assumes Security.proto is where TokenProto is declared -
  // confirm.
  import "Security.proto";
  30. /**
  31. * Extended block identifies a block
  32. */
  message ExtendedBlockProto {
    // Block pool id - globally unique across clusters.
    required string poolId = 1;

    // The local id within a pool.
    required uint64 blockId = 2;

    required uint64 generationStamp = 3;

    // len does not belong in ebid; it is here for historical reasons.
    // Defaults to 0 when absent.
    optional uint64 numBytes = 4 [default = 0];
  }
  40. /**
  41. * Identifies a Datanode
  42. */
  message DatanodeIDProto {
    // IP address.
    required string ipAddr = 1;

    // Hostname.
    required string hostName = 2;

    // UUID assigned to the Datanode. For upgraded clusters this is the same
    // as the original StorageID of the Datanode.
    required string datanodeUuid = 3;

    // Data streaming port.
    required uint32 xferPort = 4;

    // Datanode http port.
    required uint32 infoPort = 5;

    // IPC server port.
    required uint32 ipcPort = 6;

    // Datanode https port. Defaults to 0 when absent.
    optional uint32 infoSecurePort = 7 [default = 0];
  }
  55. /**
  56. * Datanode local information
  57. */
  message DatanodeLocalInfoProto {
    // All three fields are required.
    required string softwareVersion = 1;
    required string configVersion = 2;

    // NOTE(review): the time unit is not stated in this file - confirm.
    required uint64 uptime = 3;
  }
  63. /**
  64. * Datanode volume information
  65. */
  message DatanodeVolumeInfoProto {
    required string path = 1;

    // One of the StorageTypeProto values declared in this file.
    required StorageTypeProto storageType = 2;

    // NOTE(review): the space fields are presumably byte counts - confirm.
    required uint64 usedSpace = 3;
    required uint64 freeSpace = 4;
    required uint64 reservedSpace = 5;
    required uint64 reservedSpaceForReplicas = 6;

    required uint64 numBlocks = 7;
  }
  75. /**
  76. * DatanodeInfo array
  77. */
  message DatanodeInfosProto {
    // Zero or more DatanodeInfoProto entries.
    repeated DatanodeInfoProto datanodes = 1;
  }
  81. /**
  82. * The status of a Datanode
  83. */
  message DatanodeInfoProto {
    // Identity of the datanode; the only required field of this message.
    required DatanodeIDProto id = 1;

    // Each of the following counters defaults to 0 when absent.
    optional uint64 capacity = 2 [default = 0];
    optional uint64 dfsUsed = 3 [default = 0];
    optional uint64 remaining = 4 [default = 0];
    optional uint64 blockPoolUsed = 5 [default = 0];
    optional uint64 lastUpdate = 6 [default = 0];
    optional uint32 xceiverCount = 7 [default = 0];

    // No explicit default is declared for these two fields.
    optional string location = 8;
    optional uint64 nonDfsUsed = 9;

    // Values accepted by the adminState field.
    enum AdminState {
      NORMAL = 0;
      DECOMMISSION_INPROGRESS = 1;
      DECOMMISSIONED = 2;
      ENTERING_MAINTENANCE = 3;
      IN_MAINTENANCE = 4;
    }

    // Defaults to NORMAL when absent.
    optional AdminState adminState = 10 [default = NORMAL];

    optional uint64 cacheCapacity = 11 [default = 0];
    optional uint64 cacheUsed = 12 [default = 0];
    optional uint64 lastUpdateMonotonic = 13 [default = 0];

    // No explicit default is declared.
    optional string upgradeDomain = 14;

    optional uint64 lastBlockReportTime = 15 [default = 0];
    optional uint64 lastBlockReportMonotonic = 16 [default = 0];
  }
  109. /**
  110. * Represents a storage available on the datanode
  111. */
  message DatanodeStorageProto {
    // Values accepted by the state field.
    enum StorageState {
      NORMAL = 0;
      READ_ONLY_SHARED = 1;
    }

    required string storageUuid = 1;

    // Defaults to NORMAL when absent.
    optional StorageState state = 2 [default = NORMAL];

    // Defaults to DISK when absent.
    optional StorageTypeProto storageType = 3 [default = DISK];
  }
  // Per-storage report: a failure flag and usage counters, together with the
  // DatanodeStorageProto they refer to.
  message StorageReportProto {
    // Deprecated; superseded by the storage field below. Still required.
    required string storageUuid = 1 [deprecated = true];

    // Defaults to false when absent.
    optional bool failed = 2 [default = false];

    // Each of the following counters defaults to 0 when absent.
    optional uint64 capacity = 3 [default = 0];
    optional uint64 dfsUsed = 4 [default = 0];
    optional uint64 remaining = 5 [default = 0];
    optional uint64 blockPoolUsed = 6 [default = 0];

    // Supersedes storageUuid.
    optional DatanodeStorageProto storage = 7;

    // No explicit default is declared.
    optional uint64 nonDfsUsed = 8;
  }
  131. /**
  132. * Summary of a file or directory
  133. */
  message ContentSummaryProto {
    // Required totals.
    required uint64 length = 1;
    required uint64 fileCount = 2;
    required uint64 directoryCount = 3;
    required uint64 quota = 4;
    required uint64 spaceConsumed = 5;
    required uint64 spaceQuota = 6;

    // Optional per-storage-type quota and usage entries.
    optional StorageTypeQuotaInfosProto typeQuotaInfos = 7;

    // Optional snapshot-related totals; no explicit defaults are declared.
    optional uint64 snapshotLength = 8;
    optional uint64 snapshotFileCount = 9;
    optional uint64 snapshotDirectoryCount = 10;
    optional uint64 snapshotSpaceConsumed = 11;
  }
  147. /**
  148. * Summary of quota usage of a directory
  149. */
  message QuotaUsageProto {
    // Required totals.
    required uint64 fileAndDirectoryCount = 1;
    required uint64 quota = 2;
    required uint64 spaceConsumed = 3;
    required uint64 spaceQuota = 4;

    // Optional per-storage-type quota and usage entries.
    optional StorageTypeQuotaInfosProto typeQuotaInfos = 5;
  }
  157. /**
  158. * Storage type quota and usage information of a file or directory
  159. */
  message StorageTypeQuotaInfosProto {
    // Zero or more StorageTypeQuotaInfoProto entries.
    repeated StorageTypeQuotaInfoProto typeQuotaInfo = 1;
  }
  // A single entry of StorageTypeQuotaInfosProto: a storage type paired with
  // a quota value and a consumed value.
  message StorageTypeQuotaInfoProto {
    required StorageTypeProto type = 1;
    required uint64 quota = 2;
    required uint64 consumed = 3;
  }
  168. /**
  169. * Contains a list of paths corresponding to corrupt files and a cookie
  170. * used for iterative calls to NameNode.listCorruptFileBlocks.
  171. *
  172. */
  message CorruptFileBlocksProto {
    // Zero or more path strings.
    repeated string files = 1;

    // Always present (required).
    required string cookie = 2;
  }
  177. /**
  178. * File or Directory permission - same spec as POSIX
  179. */
  message FsPermissionProto {
    // Actually a short - only 16 bits used.
    required uint32 perm = 1;
  }
  183. /**
  184. * Types of recognized storage media.
  185. */
  enum StorageTypeProto {
    // Numbering starts at 1; no value is assigned to 0.
    DISK = 1;
    SSD = 2;
    ARCHIVE = 3;
    RAM_DISK = 4;
  }
  192. /**
  193. * Types of recognized blocks.
  194. */
  enum BlockTypeProto {
    // Numbering starts at 0.
    CONTIGUOUS = 0;
    STRIPED = 1;
  }
  199. /**
  200. * A list of storage types.
  201. */
  message StorageTypesProto {
    // Zero or more StorageTypeProto values.
    repeated StorageTypeProto storageTypes = 1;
  }
  205. /**
  206. * Block replica storage policy.
  207. */
  message BlockStoragePolicyProto {
    required uint32 policyId = 1;
    required string name = 2;

    // A list of storage types for storing the block replicas when creating a
    // block.
    required StorageTypesProto creationPolicy = 3;

    // A list of storage types for creation fallback storage.
    optional StorageTypesProto creationFallbackPolicy = 4;

    // Optional, like creationFallbackPolicy.
    optional StorageTypesProto replicationFallbackPolicy = 5;
  }
  218. /**
  219. * A LocatedBlock gives information about a block and its location.
  220. */
  message LocatedBlockProto {
    required ExtendedBlockProto b = 1;

    // Offset of first byte of block in the file.
    required uint64 offset = 2;

    // Locations ordered by proximity to client ip.
    repeated DatanodeInfoProto locs = 3;

    // True if all replicas of a block are corrupt, else false.
    // If block has few corrupt replicas, they are filtered and
    // their locations are not part of this object.
    required bool corrupt = 4;

    required hadoop.common.TokenProto blockToken = 5;

    // If a location in locs is cached. Declared with packed encoding.
    repeated bool isCached = 6 [packed = true];

    repeated StorageTypeProto storageTypes = 7;
    repeated string storageIDs = 8;

    // Striped block related fields.

    // Used for striped block to indicate block index for each storage.
    optional bytes blockIndices = 9;

    // Each internal block has a block token.
    repeated hadoop.common.TokenProto blockTokens = 10;
  }
  // Carries a key id, block pool id, nonce, key bytes and expiry date, plus
  // an optional algorithm name.
  message DataEncryptionKeyProto {
    required uint32 keyId = 1;
    required string blockPoolId = 2;
    required bytes nonce = 3;
    required bytes encryptionKey = 4;

    // NOTE(review): the unit/epoch of this value is not stated in this file -
    // confirm.
    required uint64 expiryDate = 5;

    // The only optional field; no explicit default is declared.
    optional string encryptionAlgorithm = 6;
  }
  244. /**
  245. * Cipher suite.
  246. */
  enum CipherSuiteProto {
    // Numbering starts at 1; no value is assigned to 0.
    UNKNOWN = 1;
    AES_CTR_NOPADDING = 2;
  }
  251. /**
  252. * Crypto protocol version used to access encrypted files.
  253. */
  enum CryptoProtocolVersionProto {
    // Numbering starts at 1; no value is assigned to 0.
    UNKNOWN_PROTOCOL_VERSION = 1;
    ENCRYPTION_ZONES = 2;
  }
  258. /**
  259. * Encryption information for a file.
  260. */
  message FileEncryptionInfoProto {
    // Every field of this message is required.
    required CipherSuiteProto suite = 1;
    required CryptoProtocolVersionProto cryptoProtocolVersion = 2;

    // Raw bytes.
    required bytes key = 3;
    required bytes iv = 4;

    required string keyName = 5;
    required string ezKeyVersionName = 6;
  }
  269. /**
  270. * Encryption information for an individual
  271. * file within an encryption zone
  272. */
  message PerFileEncryptionInfoProto {
    // Same names and types as the key, iv and ezKeyVersionName fields of
    // FileEncryptionInfoProto; all required.
    required bytes key = 1;
    required bytes iv = 2;
    required string ezKeyVersionName = 3;
  }
  278. /**
  279. * Encryption information for an encryption
  280. * zone
  281. */
  message ZoneEncryptionInfoProto {
    // Same names and types as the suite, cryptoProtocolVersion and keyName
    // fields of FileEncryptionInfoProto; all required.
    required CipherSuiteProto suite = 1;
    required CryptoProtocolVersionProto cryptoProtocolVersion = 2;
    required string keyName = 3;
  }
  287. /**
  288. * Cipher option
  289. */
  message CipherOptionProto {
    // The only required field.
    required CipherSuiteProto suite = 1;

    // Optional raw byte fields; no explicit defaults are declared.
    optional bytes inKey = 2;
    optional bytes inIv = 3;
    optional bytes outKey = 4;
    optional bytes outIv = 5;
  }
  297. /**
  298. * A set of file blocks and their locations.
  299. */
  message LocatedBlocksProto {
    required uint64 fileLength = 1;

    // Zero or more located blocks.
    repeated LocatedBlockProto blocks = 2;

    required bool underConstruction = 3;

    // Optional, while the isLastBlockComplete flag below is required.
    optional LocatedBlockProto lastBlock = 4;
    required bool isLastBlockComplete = 5;

    optional FileEncryptionInfoProto fileEncryptionInfo = 6;

    // Optional field for erasure coding.
    optional ErasureCodingPolicyProto ecPolicy = 7;
  }
  310. /**
  311. * ECSchema options entry
  312. */
  message ECSchemaOptionEntryProto {
    // A string key/value pair; both parts are required.
    required string key = 1;
    required string value = 2;
  }
  317. /**
  318. * ECSchema for erasure coding
  319. */
  message ECSchemaProto {
    required string codecName = 1;
    required uint32 dataUnits = 2;
    required uint32 parityUnits = 3;

    // Zero or more key/value option entries.
    repeated ECSchemaOptionEntryProto options = 4;
  }
  // Erasure coding policy: a required id plus an optional name, schema and
  // cell size.
  message ErasureCodingPolicyProto {
    // Optional fields; no explicit defaults are declared.
    optional string name = 1;
    optional ECSchemaProto schema = 2;
    optional uint32 cellSize = 3;

    // Actually a byte - only 8 bits used.
    required uint32 id = 4;
  }
  // Pairs an ErasureCodingPolicyProto with a success flag and an optional
  // error message.
  message AddingECPolicyResponseProto {
    required ErasureCodingPolicyProto policy = 1;
    required bool succeed = 2;

    // NOTE(review): presumably only set when succeed is false - confirm.
    optional string errorMsg = 3;
  }
  337. /**
  338. * Status of a file, directory or symlink
  339. * Optionally includes a file's block locations if requested by client on the rpc call.
  340. */
  message HdfsFileStatusProto {
    // Values accepted by the fileType field. Numbering starts at 1.
    enum FileType {
      IS_DIR = 1;
      IS_FILE = 2;
      IS_SYMLINK = 3;
    }

    required FileType fileType = 1;

    // Local name of inode encoded java UTF8.
    required bytes path = 2;

    required uint64 length = 3;
    required FsPermissionProto permission = 4;
    required string owner = 5;
    required string group = 6;
    required uint64 modification_time = 7;
    required uint64 access_time = 8;

    // Optional fields for symlink.

    // If symlink, target encoded java UTF8.
    optional bytes symlink = 9;

    // Optional fields for file.

    // Only 16 bits used. Defaults to 0 when absent.
    optional uint32 block_replication = 10 [default = 0];

    // Defaults to 0 when absent.
    optional uint64 blocksize = 11 [default = 0];

    // Supplied only if asked by client.
    optional LocatedBlocksProto locations = 12;

    // Optional field for fileId.

    // Default as an invalid id.
    optional uint64 fileId = 13 [default = 0];

    // Defaults to -1 when absent.
    optional int32 childrenNum = 14 [default = -1];

    // Optional field for file encryption.
    optional FileEncryptionInfoProto fileEncryptionInfo = 15;

    // Block storage policy id. Defaults to 0 when absent.
    optional uint32 storagePolicy = 16 [default = 0];

    // Optional field for erasure coding.
    optional ErasureCodingPolicyProto ecPolicy = 17;
  }
  370. /**
  371. * Checksum algorithms/types used in HDFS
  372. * Make sure this enum's integer values match enum values' id properties defined
  373. * in org.apache.hadoop.util.DataChecksum.Type
  374. */
  enum ChecksumTypeProto {
    // Numbering starts at 0.
    CHECKSUM_NULL = 0;
    CHECKSUM_CRC32 = 1;
    CHECKSUM_CRC32C = 2;
  }
  380. /**
  381. * HDFS Server Defaults
  382. */
  message FsServerDefaultsProto {
    required uint64 blockSize = 1;
    required uint32 bytesPerChecksum = 2;
    required uint32 writePacketSize = 3;

    // Actually a short - only 16 bits used.
    required uint32 replication = 4;

    required uint32 fileBufferSize = 5;

    // Defaults to false when absent.
    optional bool encryptDataTransfer = 6 [default = false];

    // Defaults to 0 when absent.
    // NOTE(review): the time unit is not stated in this file - confirm.
    optional uint64 trashInterval = 7 [default = 0];

    // Defaults to CHECKSUM_CRC32 when absent.
    optional ChecksumTypeProto checksumType = 8 [default = CHECKSUM_CRC32];

    // No explicit default is declared.
    optional string keyProviderUri = 9;

    // Defaults to 0 when absent.
    optional uint32 policyId = 10 [default = 0];
  }
  395. /**
  396. * Directory listing
  397. */
  message DirectoryListingProto {
    // Zero or more file status entries.
    repeated HdfsFileStatusProto partialListing = 1;

    // NOTE(review): presumably the number of entries not included in
    // partialListing - confirm.
    required uint32 remainingEntries = 2;
  }
  402. /**
  403. * Status of a snapshottable directory: besides the normal information for
  404. * a directory status, also include snapshot quota, number of snapshots, and
  405. * the full path of the parent directory.
  406. */
  message SnapshottableDirectoryStatusProto {
    required HdfsFileStatusProto dirStatus = 1;

    // Fields specific for snapshottable directory.
    required uint32 snapshot_quota = 2;
    required uint32 snapshot_number = 3;

    // Declared as bytes rather than string.
    required bytes parent_fullpath = 4;
  }
  414. /**
  415. * Snapshottable directory listing
  416. */
  message SnapshottableDirectoryListingProto {
    // Zero or more SnapshottableDirectoryStatusProto entries.
    repeated SnapshottableDirectoryStatusProto snapshottableDirListing = 1;
  }
  420. /**
  421. * Snapshot diff report entry
  422. */
  message SnapshotDiffReportEntryProto {
    // Declared as bytes rather than string.
    required bytes fullpath = 1;

    required string modificationLabel = 2;

    // Optional; declared as bytes rather than string.
    optional bytes targetPath = 3;
  }
  428. /**
  429. * Snapshot diff report
  430. */
  message SnapshotDiffReportProto {
    // Full path of the directory where snapshots were taken.
    required string snapshotRoot = 1;

    required string fromSnapshot = 2;
    required string toSnapshot = 3;

    // Zero or more diff entries.
    repeated SnapshotDiffReportEntryProto diffReportEntries = 4;
  }
  438. /**
  439. * Block information
  440. *
  441. * Please be wary of adding additional fields here, since INodeFiles
  442. * need to fit in PB's default max message size of 64MB.
  443. * We restrict the max # of blocks per file
  444. * (dfs.namenode.fs-limits.max-blocks-per-file), but it's better
  445. * to avoid changing this.
  446. */
  message BlockProto {
    required uint64 blockId = 1;
    required uint64 genStamp = 2;

    // Defaults to 0 when absent.
    optional uint64 numBytes = 3 [default = 0];
  }
  452. /**
  453. * Information related to a snapshot
  454. * TODO: add more information
  455. */
  message SnapshotInfoProto {
    // Every field of this message is required.
    required string snapshotName = 1;
    required string snapshotRoot = 2;
    required FsPermissionProto permission = 3;
    required string owner = 4;
    required string group = 5;

    // Declared as a string, not a numeric timestamp.
    required string createTime = 6;

    // TODO: do we need access time?
  }
  465. /**
  466. * Rolling upgrade status
  467. */
  message RollingUpgradeStatusProto {
    required string blockPoolId = 1;

    // Defaults to false when absent.
    optional bool finalized = 2 [default = false];
  }
  472. /**
  473. * A list of storage IDs.
  474. */
  message StorageUuidsProto {
    // Zero or more storage UUID strings.
    repeated string storageUuids = 1;
  }
  478. /**
  479. * File access permissions mode.
  480. */
  enum AccessModeProto {
    // Numbering starts at 1; no value is assigned to 0.
    READ = 1;
    WRITE = 2;
    COPY = 3;
    REPLACE = 4;
  }
  487. /**
  488. * Secret information for the BlockKeyProto. This is not sent on the wire as
  489. * such, but is packed into a byte array, encrypted, and put in
  490. * BlockKeyProto.bytes
  491. * When adding further fields, make sure they are optional as they would
  492. * otherwise not be backwards compatible.
  493. *
  494. * Note: As part of the migration from WritableUtils based tokens (aka "legacy")
  495. * to Protocol Buffers, we use the first byte to determine the type. If the
  496. * first byte is <=0 then it is a legacy token. This means that when using
  497. * protobuf tokens, the first field sent must have a `field_number` less
  498. * than 16 to make sure that the first byte is positive. Otherwise it could be
  499. * parsed as a legacy token. See HDFS-11026 for more discussion.
  500. */
  message BlockTokenSecretProto {
    // Every field here is optional or repeated, and every field number is
    // below 16.
    optional uint64 expiryDate = 1;
    optional uint32 keyId = 2;
    optional string userId = 3;
    optional string blockPoolId = 4;
    optional uint64 blockId = 5;

    // Zero or more access modes.
    repeated AccessModeProto modes = 6;

    // Zero or more storage types.
    repeated StorageTypeProto storageTypes = 7;

    // Zero or more storage id strings.
    repeated string storageIds = 8;
  }