install_packages.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434
  1. #!/usr/bin/env python
  2. """
  3. Licensed to the Apache Software Foundation (ASF) under one
  4. or more contributor license agreements. See the NOTICE file
  5. distributed with this work for additional information
  6. regarding copyright ownership. The ASF licenses this file
  7. to you under the Apache License, Version 2.0 (the
  8. "License"); you may not use this file except in compliance
  9. with the License. You may obtain a copy of the License at
  10. http://www.apache.org/licenses/LICENSE-2.0
  11. Unless required by applicable law or agreed to in writing, software
  12. distributed under the License is distributed on an "AS IS" BASIS,
  13. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  14. See the License for the specific language governing permissions and
  15. limitations under the License.
  16. Ambari Agent
  17. """
  18. import os
  19. import signal
  20. import re
  21. import os.path
  22. import ambari_simplejson as json # simplejson is much faster comparing to Python 2.6 json module and has the same functions set.
  23. from resource_management import *
  24. import resource_management
  25. from resource_management.libraries.functions.list_ambari_managed_repos import list_ambari_managed_repos
  26. from ambari_commons.os_check import OSCheck, OSConst
  27. from resource_management.libraries.functions.packages_analyzer import allInstalledPackages
  28. from resource_management.libraries.functions import conf_select
  29. from resource_management.libraries.functions.hdp_select import get_hdp_versions
  30. from resource_management.libraries.functions.version import compare_versions, format_hdp_stack_version
  31. from resource_management.libraries.functions.repo_version_history \
  32. import read_actual_version_from_history_file, write_actual_version_to_history_file, REPO_VERSION_HISTORY_FILE
  33. from resource_management.core.logger import Logger
  34. class InstallPackages(Script):
  35. """
  36. This script is a part of Rolling Upgrade workflow and is described at
  37. appropriate design doc.
  38. It installs repositories to the node and then installs packages.
  39. For now, repositories are installed into individual files.
  40. """
  41. UBUNTU_REPO_COMPONENTS_POSTFIX = ["main"]
  42. REPO_FILE_NAME_PREFIX = 'HDP-'
  43. STACK_TO_ROOT_FOLDER = {"HDP": "/usr/hdp"}
  44. def actionexecute(self, env):
  45. num_errors = 0
  46. # Parse parameters
  47. config = Script.get_config()
  48. repo_rhel_suse = config['configurations']['cluster-env']['repo_suse_rhel_template']
  49. repo_ubuntu = config['configurations']['cluster-env']['repo_ubuntu_template']
  50. template = repo_rhel_suse if OSCheck.is_redhat_family() or OSCheck.is_suse_family() else repo_ubuntu
  51. # Handle a SIGTERM and SIGINT gracefully
  52. signal.signal(signal.SIGTERM, self.abort_handler)
  53. signal.signal(signal.SIGINT, self.abort_handler)
  54. # Select dict that contains parameters
  55. try:
  56. self.repository_version = config['roleParams']['repository_version']
  57. base_urls = json.loads(config['roleParams']['base_urls'])
  58. package_list = json.loads(config['roleParams']['package_list'])
  59. stack_id = config['roleParams']['stack_id']
  60. except KeyError:
  61. # Last try
  62. self.repository_version = config['commandParams']['repository_version']
  63. base_urls = json.loads(config['commandParams']['base_urls'])
  64. package_list = json.loads(config['commandParams']['package_list'])
  65. stack_id = config['commandParams']['stack_id']
  66. # current stack information
  67. self.current_hdp_stack_version = None
  68. if 'stack_version' in config['hostLevelParams']:
  69. current_stack_version_unformatted = str(config['hostLevelParams']['stack_version'])
  70. self.current_hdp_stack_version = format_hdp_stack_version(current_stack_version_unformatted)
  71. stack_name = None
  72. self.stack_root_folder = None
  73. if stack_id and "-" in stack_id:
  74. stack_split = stack_id.split("-")
  75. if len(stack_split) == 2:
  76. stack_name = stack_split[0].upper()
  77. if stack_name in self.STACK_TO_ROOT_FOLDER:
  78. self.stack_root_folder = self.STACK_TO_ROOT_FOLDER[stack_name]
  79. if self.stack_root_folder is None:
  80. raise Fail("Cannot determine the stack's root directory by parsing the stack_id property, {0}".format(str(stack_id)))
  81. if self.repository_version is None:
  82. raise Fail("Cannot determine the repository version to install")
  83. self.repository_version = self.repository_version.strip()
  84. # Install/update repositories
  85. installed_repositories = []
  86. self.current_repositories = []
  87. self.current_repo_files = set()
  88. # Enable base system repositories
  89. # We don't need that for RHEL family, because we leave all repos enabled
  90. # except disabled HDP* ones
  91. if OSCheck.is_suse_family():
  92. self.current_repositories.append('base')
  93. elif OSCheck.is_ubuntu_family():
  94. self.current_repo_files.add('base')
  95. Logger.info("Will install packages for repository version {0}".format(self.repository_version))
  96. try:
  97. append_to_file = False
  98. for url_info in base_urls:
  99. repo_name, repo_file = self.install_repository(url_info, append_to_file, template)
  100. self.current_repositories.append(repo_name)
  101. self.current_repo_files.add(repo_file)
  102. append_to_file = True
  103. installed_repositories = list_ambari_managed_repos()
  104. except Exception, err:
  105. Logger.logger.exception("Cannot distribute repositories. Error: {0}".format(str(err)))
  106. num_errors += 1
  107. # Build structured output with initial values
  108. self.structured_output = {
  109. 'ambari_repositories': installed_repositories,
  110. 'installed_repository_version': self.repository_version,
  111. 'stack_id': stack_id,
  112. 'package_installation_result': 'FAIL'
  113. }
  114. self.put_structured_out(self.structured_output)
  115. if num_errors > 0:
  116. raise Fail("Failed to distribute repositories/install packages")
  117. # Initial list of versions, used to compute the new version installed
  118. self.old_versions = get_hdp_versions(self.stack_root_folder)
  119. try:
  120. is_package_install_successful = False
  121. ret_code = self.install_packages(package_list)
  122. if ret_code == 0:
  123. self.structured_output['package_installation_result'] = 'SUCCESS'
  124. self.put_structured_out(self.structured_output)
  125. is_package_install_successful = True
  126. else:
  127. num_errors += 1
  128. except Exception, err:
  129. num_errors += 1
  130. Logger.logger.exception("Could not install packages. Error: {0}".format(str(err)))
  131. # Provide correct exit code
  132. if num_errors > 0:
  133. raise Fail("Failed to distribute repositories/install packages")
  134. # if installing a version of HDP that needs some symlink love, then create them
  135. if is_package_install_successful and 'actual_version' in self.structured_output:
  136. self._create_config_links_if_necessary(stack_id, self.structured_output['actual_version'])
  137. def _create_config_links_if_necessary(self, stack_id, stack_version):
  138. """
  139. Sets up the required structure for /etc/<component>/conf symlinks and /usr/hdp/current
  140. configuration symlinks IFF the current stack is < HDP 2.3+ and the new stack is >= HDP 2.3
  141. stack_id: stack id, ie HDP-2.3
  142. stack_version: version to set, ie 2.3.0.0-1234
  143. """
  144. if stack_id is None:
  145. Logger.info("Cannot create config links when stack_id is not defined")
  146. return
  147. args = stack_id.upper().split('-')
  148. if len(args) != 2:
  149. Logger.info("Unrecognized stack id {0}, cannot create config links".format(stack_id))
  150. return
  151. if args[0] != "HDP":
  152. Logger.info("Unrecognized stack name {0}, cannot create config links".format(args[0]))
  153. if compare_versions(format_hdp_stack_version(args[1]), "2.3.0.0") < 0:
  154. Logger.info("Configuration symlinks are not needed for {0}, only HDP-2.3+".format(stack_version))
  155. return
  156. for package_name, directories in conf_select.PACKAGE_DIRS.iteritems():
  157. # if already on HDP 2.3, then we should skip making conf.backup folders
  158. if self.current_hdp_stack_version and compare_versions(self.current_hdp_stack_version, '2.3') >= 0:
  159. Logger.info("The current cluster stack of {0} does not require backing up configurations; "
  160. "only conf-select versioned config directories will be created.".format(stack_version))
  161. # only link configs for all known packages
  162. conf_select.link_component_conf_to_versioned_config(package_name, stack_version)
  163. else:
  164. # link configs and create conf.backup folders for all known packages
  165. conf_select.convert_conf_directories_to_symlinks(package_name, stack_version, directories,
  166. skip_existing_links = False, link_to = "backup")
  167. def compute_actual_version(self):
  168. """
  169. After packages are installed, determine what the new actual version is.
  170. """
  171. # If the repo contains a build number, optimistically assume it to be the actual_version. It will get changed
  172. # to correct value if it is not
  173. self.actual_version = None
  174. self.repo_version_with_build_number = None
  175. if self.repository_version:
  176. m = re.search("[\d\.]+-\d+", self.repository_version)
  177. if m:
  178. # Contains a build number
  179. self.repo_version_with_build_number = self.repository_version
  180. self.structured_output['actual_version'] = self.repo_version_with_build_number # This is the best value known so far.
  181. self.put_structured_out(self.structured_output)
  182. Logger.info("Attempting to determine actual version with build number.")
  183. Logger.info("Old versions: {0}".format(self.old_versions))
  184. new_versions = get_hdp_versions(self.stack_root_folder)
  185. Logger.info("New versions: {0}".format(new_versions))
  186. deltas = set(new_versions) - set(self.old_versions)
  187. Logger.info("Deltas: {0}".format(deltas))
  188. # Get version without build number
  189. normalized_repo_version = self.repository_version.split('-')[0]
  190. if 1 == len(deltas):
  191. self.actual_version = next(iter(deltas)).strip()
  192. self.structured_output['actual_version'] = self.actual_version
  193. self.put_structured_out(self.structured_output)
  194. write_actual_version_to_history_file(normalized_repo_version, self.actual_version)
  195. Logger.info(
  196. "Found actual version {0} by checking the delta between versions before and after installing packages".format(
  197. self.actual_version))
  198. else:
  199. # If the first install attempt does a partial install and is unable to report this to the server,
  200. # then a subsequent attempt will report an empty delta. For this reason, we search for a best fit version for the repo version
  201. Logger.info("Cannot determine actual version installed by checking the delta between versions "
  202. "before and after installing package")
  203. Logger.info("Will try to find for the actual version by searching for best possible match in the list of versions installed")
  204. self.actual_version = self.find_best_fit_version(new_versions, self.repository_version)
  205. if self.actual_version is not None:
  206. self.actual_version = self.actual_version.strip()
  207. self.structured_output['actual_version'] = self.actual_version
  208. self.put_structured_out(self.structured_output)
  209. Logger.info("Found actual version {0} by searching for best possible match".format(self.actual_version))
  210. else:
  211. msg = "Could not determine actual version installed. Try reinstalling packages again."
  212. raise Fail(msg)
  213. def check_partial_install(self):
  214. """
  215. If an installation did not complete successfully, check if installation was partially complete and
  216. log the partially completed version to REPO_VERSION_HISTORY_FILE.
  217. :return:
  218. """
  219. Logger.info("Installation of packages failed. Checking if installation was partially complete")
  220. Logger.info("Old versions: {0}".format(self.old_versions))
  221. new_versions = get_hdp_versions(self.stack_root_folder)
  222. Logger.info("New versions: {0}".format(new_versions))
  223. deltas = set(new_versions) - set(self.old_versions)
  224. Logger.info("Deltas: {0}".format(deltas))
  225. # Get version without build number
  226. normalized_repo_version = self.repository_version.split('-')[0]
  227. if 1 == len(deltas):
  228. # Some packages were installed successfully. Log this version to REPO_VERSION_HISTORY_FILE
  229. partial_install_version = next(iter(deltas)).strip()
  230. write_actual_version_to_history_file(normalized_repo_version, partial_install_version)
  231. Logger.info("Version {0} was partially installed. ".format(partial_install_version))
  232. def find_best_fit_version(self, versions, repo_version):
  233. """
  234. Given a list of installed versions and a repo version, search for a version that best fits the repo version
  235. If the repo version is found in the list of installed versions, return the repo version itself.
  236. If the repo version is not found in the list of installed versions
  237. normalize the repo version and use the REPO_VERSION_HISTORY_FILE file to search the list.
  238. :param versions: List of versions installed
  239. :param repo_version: Repo version to search
  240. :return: Matching version, None if no match was found.
  241. """
  242. if versions is None or repo_version is None:
  243. return None
  244. build_num_match = re.search("[\d\.]+-\d+", repo_version)
  245. if build_num_match and repo_version in versions:
  246. # If repo version has build number and is found in the list of versions, return it as the matching version
  247. Logger.info("Best Fit Version: Resolved from repo version with valid build number: {0}".format(repo_version))
  248. return repo_version
  249. # Get version without build number
  250. normalized_repo_version = repo_version.split('-')[0]
  251. # Find all versions that match the normalized repo version
  252. match_versions = filter(lambda x: x.startswith(normalized_repo_version), versions)
  253. if match_versions:
  254. if len(match_versions) == 1:
  255. # Resolved without conflicts
  256. Logger.info("Best Fit Version: Resolved from normalized repo version without conflicts: {0}".format(match_versions[0]))
  257. return match_versions[0]
  258. # Resolve conflicts using REPO_VERSION_HISTORY_FILE
  259. history_version = read_actual_version_from_history_file(normalized_repo_version)
  260. # Validate history version retrieved is valid
  261. if history_version in match_versions:
  262. Logger.info("Best Fit Version: Resolved from normalized repo version using {0}: {1}".format(REPO_VERSION_HISTORY_FILE, history_version))
  263. return history_version
  264. # No matching version
  265. return None
  266. def install_packages(self, package_list):
  267. """
  268. Actually install the packages using the package manager.
  269. :param package_list: List of package names to install
  270. :return: Returns 0 if no errors were found, and 1 otherwise.
  271. """
  272. ret_code = 0
  273. # Install packages
  274. packages_were_checked = False
  275. try:
  276. Package("hdp-select",
  277. action="upgrade",
  278. )
  279. packages_installed_before = []
  280. allInstalledPackages(packages_installed_before)
  281. packages_installed_before = [package[0] for package in packages_installed_before]
  282. packages_were_checked = True
  283. filtered_package_list = self.filter_package_list(package_list)
  284. for package in filtered_package_list:
  285. name = self.format_package_name(package['name'])
  286. Package(name,
  287. action="upgrade" # this enables upgrading non-versioned packages, despite the fact they exist. Needed by 'mahout' which is non-version but have to be updated
  288. )
  289. except Exception, err:
  290. ret_code = 1
  291. Logger.logger.exception("Package Manager failed to install packages. Error: {0}".format(str(err)))
  292. # Remove already installed packages in case of fail
  293. if packages_were_checked and packages_installed_before:
  294. packages_installed_after = []
  295. allInstalledPackages(packages_installed_after)
  296. packages_installed_after = [package[0] for package in packages_installed_after]
  297. packages_installed_before = set(packages_installed_before)
  298. new_packages_installed = [package for package in packages_installed_after if package not in packages_installed_before]
  299. if OSCheck.is_ubuntu_family():
  300. package_version_string = self.repository_version.replace('.', '-')
  301. else:
  302. package_version_string = self.repository_version.replace('-', '_')
  303. package_version_string = package_version_string.replace('.', '_')
  304. for package in new_packages_installed:
  305. if package_version_string and (package_version_string in package):
  306. Package(package, action="remove")
  307. # Compute the actual version in order to save it in structured out
  308. try:
  309. if ret_code == 0:
  310. self.compute_actual_version()
  311. else:
  312. self.check_partial_install()
  313. except Fail, err:
  314. ret_code = 1
  315. Logger.logger.exception("Failure while computing actual version. Error: {0}".format(str(err)))
  316. return ret_code
  317. def install_repository(self, url_info, append_to_file, template):
  318. repo = {
  319. 'repoName': "{0}-{1}".format(url_info['name'], self.repository_version)
  320. }
  321. if not 'baseUrl' in url_info:
  322. repo['baseurl'] = None
  323. else:
  324. repo['baseurl'] = url_info['baseUrl']
  325. if not 'mirrorsList' in url_info:
  326. repo['mirrorsList'] = None
  327. else:
  328. repo['mirrorsList'] = url_info['mirrorsList']
  329. ubuntu_components = [url_info['name']] + self.UBUNTU_REPO_COMPONENTS_POSTFIX
  330. file_name = self.REPO_FILE_NAME_PREFIX + self.repository_version
  331. Repository(repo['repoName'],
  332. action = "create",
  333. base_url = repo['baseurl'],
  334. mirror_list = repo['mirrorsList'],
  335. repo_file_name = file_name,
  336. repo_template = template,
  337. append_to_file = append_to_file,
  338. components = ubuntu_components, # ubuntu specific
  339. )
  340. return repo['repoName'], file_name
  341. def abort_handler(self, signum, frame):
  342. Logger.error("Caught signal {0}, will handle it gracefully. Compute the actual version if possible before exiting.".format(signum))
  343. self.check_partial_install()
  344. def filter_package_list(self, package_list):
  345. """
  346. Note: that we have skipUpgrade option in metainfo.xml to filter packages,
  347. as well as condition option to filter them conditionally,
  348. so use this method only if, for some reason the metainfo option cannot be used.
  349. :param package_list: original list
  350. :return: filtered package_list
  351. """
  352. filtered_package_list = []
  353. for package in package_list:
  354. if Script.check_package_condition(package):
  355. filtered_package_list.append(package)
  356. return filtered_package_list
  357. if __name__ == "__main__":
  358. InstallPackages().execute()