validation.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435
  1. from __future__ import absolute_import
  2. from __future__ import unicode_literals
  3. import json
  4. import logging
  5. import os
  6. import re
  7. import sys
  8. import six
  9. from docker.utils.ports import split_port
  10. from jsonschema import Draft4Validator
  11. from jsonschema import FormatChecker
  12. from jsonschema import RefResolver
  13. from jsonschema import ValidationError
  14. from .errors import ConfigurationError
  15. from .errors import VERSION_EXPLANATION
  16. from .sort_services import get_service_name_from_network_mode
  17. log = logging.getLogger(__name__)
  18. DOCKER_CONFIG_HINTS = {
  19. 'cpu_share': 'cpu_shares',
  20. 'add_host': 'extra_hosts',
  21. 'hosts': 'extra_hosts',
  22. 'extra_host': 'extra_hosts',
  23. 'device': 'devices',
  24. 'link': 'links',
  25. 'memory_swap': 'memswap_limit',
  26. 'port': 'ports',
  27. 'privilege': 'privileged',
  28. 'priviliged': 'privileged',
  29. 'privilige': 'privileged',
  30. 'volume': 'volumes',
  31. 'workdir': 'working_dir',
  32. }
  33. VALID_NAME_CHARS = '[a-zA-Z0-9\._\-]'
  34. VALID_EXPOSE_FORMAT = r'^\d+(\-\d+)?(\/[a-zA-Z]+)?$'
  35. @FormatChecker.cls_checks(format="ports", raises=ValidationError)
  36. def format_ports(instance):
  37. try:
  38. split_port(instance)
  39. except ValueError as e:
  40. raise ValidationError(six.text_type(e))
  41. return True
  42. @FormatChecker.cls_checks(format="expose", raises=ValidationError)
  43. def format_expose(instance):
  44. if isinstance(instance, six.string_types):
  45. if not re.match(VALID_EXPOSE_FORMAT, instance):
  46. raise ValidationError(
  47. "should be of the format 'PORT[/PROTOCOL]'")
  48. return True
  49. @FormatChecker.cls_checks(format="bool-value-in-mapping")
  50. def format_boolean_in_environment(instance):
  51. """
  52. Check if there is a boolean in the environment and display a warning.
  53. Always return True here so the validation won't raise an error.
  54. """
  55. if isinstance(instance, bool):
  56. log.warn(
  57. "There is a boolean value in the 'environment' key.\n"
  58. "Environment variables can only be strings.\n"
  59. "Please add quotes to any boolean values to make them string "
  60. "(eg, 'True', 'yes', 'N').\n"
  61. "This warning will become an error in a future release. \r\n"
  62. )
  63. return True
  64. def match_named_volumes(service_dict, project_volumes):
  65. service_volumes = service_dict.get('volumes', [])
  66. for volume_spec in service_volumes:
  67. if volume_spec.is_named_volume and volume_spec.external not in project_volumes:
  68. raise ConfigurationError(
  69. 'Named volume "{0}" is used in service "{1}" but no'
  70. ' declaration was found in the volumes section.'.format(
  71. volume_spec.repr(), service_dict.get('name')
  72. )
  73. )
  74. def python_type_to_yaml_type(type_):
  75. type_name = type(type_).__name__
  76. return {
  77. 'dict': 'mapping',
  78. 'list': 'array',
  79. 'int': 'number',
  80. 'float': 'number',
  81. 'bool': 'boolean',
  82. 'unicode': 'string',
  83. 'str': 'string',
  84. 'bytes': 'string',
  85. }.get(type_name, type_name)
  86. def validate_config_section(filename, config, section):
  87. """Validate the structure of a configuration section. This must be done
  88. before interpolation so it's separate from schema validation.
  89. """
  90. if not isinstance(config, dict):
  91. raise ConfigurationError(
  92. "In file '{filename}', {section} must be a mapping, not "
  93. "{type}.".format(
  94. filename=filename,
  95. section=section,
  96. type=anglicize_json_type(python_type_to_yaml_type(config))))
  97. for key, value in config.items():
  98. if not isinstance(key, six.string_types):
  99. raise ConfigurationError(
  100. "In file '{filename}', the {section} name {name} must be a "
  101. "quoted string, i.e. '{name}'.".format(
  102. filename=filename,
  103. section=section,
  104. name=key))
  105. if not isinstance(value, (dict, type(None))):
  106. raise ConfigurationError(
  107. "In file '{filename}', {section} '{name}' must be a mapping not "
  108. "{type}.".format(
  109. filename=filename,
  110. section=section,
  111. name=key,
  112. type=anglicize_json_type(python_type_to_yaml_type(value))))
  113. def validate_top_level_object(config_file):
  114. if not isinstance(config_file.config, dict):
  115. raise ConfigurationError(
  116. "Top level object in '{}' needs to be an object not '{}'.".format(
  117. config_file.filename,
  118. type(config_file.config)))
  119. def validate_ulimits(service_config):
  120. ulimit_config = service_config.config.get('ulimits', {})
  121. for limit_name, soft_hard_values in six.iteritems(ulimit_config):
  122. if isinstance(soft_hard_values, dict):
  123. if not soft_hard_values['soft'] <= soft_hard_values['hard']:
  124. raise ConfigurationError(
  125. "Service '{s.name}' has invalid ulimit '{ulimit}'. "
  126. "'soft' value can not be greater than 'hard' value ".format(
  127. s=service_config,
  128. ulimit=ulimit_config))
  129. def validate_extends_file_path(service_name, extends_options, filename):
  130. """
  131. The service to be extended must either be defined in the config key 'file',
  132. or within 'filename'.
  133. """
  134. error_prefix = "Invalid 'extends' configuration for %s:" % service_name
  135. if 'file' not in extends_options and filename is None:
  136. raise ConfigurationError(
  137. "%s you need to specify a 'file', e.g. 'file: something.yml'" % error_prefix
  138. )
  139. def validate_network_mode(service_config, service_names):
  140. network_mode = service_config.config.get('network_mode')
  141. if not network_mode:
  142. return
  143. if 'networks' in service_config.config:
  144. raise ConfigurationError("'network_mode' and 'networks' cannot be combined")
  145. dependency = get_service_name_from_network_mode(network_mode)
  146. if not dependency:
  147. return
  148. if dependency not in service_names:
  149. raise ConfigurationError(
  150. "Service '{s.name}' uses the network stack of service '{dep}' which "
  151. "is undefined.".format(s=service_config, dep=dependency))
  152. def validate_depends_on(service_config, service_names):
  153. for dependency in service_config.config.get('depends_on', []):
  154. if dependency not in service_names:
  155. raise ConfigurationError(
  156. "Service '{s.name}' depends on service '{dep}' which is "
  157. "undefined.".format(s=service_config, dep=dependency))
  158. def get_unsupported_config_msg(path, error_key):
  159. msg = "Unsupported config option for {}: '{}'".format(path_string(path), error_key)
  160. if error_key in DOCKER_CONFIG_HINTS:
  161. msg += " (did you mean '{}'?)".format(DOCKER_CONFIG_HINTS[error_key])
  162. return msg
  163. def anglicize_json_type(json_type):
  164. if json_type.startswith(('a', 'e', 'i', 'o', 'u')):
  165. return 'an ' + json_type
  166. return 'a ' + json_type
  167. def is_service_dict_schema(schema_id):
  168. return schema_id == 'fields_schema_v1.json' or schema_id == '#/properties/services'
def handle_error_for_schema_with_id(error, path):
    """Build a tailored message for an error whose schema carries an 'id'.

    The checks run in order and the first match wins:

    1. an 'additionalProperties' error on the services schema is reported
       as an invalid service name;
    2. an error on '#/definitions/constraints' is reported as an image /
       build / dockerfile conflict, when one of the three cases applies;
    3. any other 'additionalProperties' error is reported as an unsupported
       option (on '#/definitions/service'), or, when the error has no path,
       as the raw message followed by VERSION_EXPLANATION.

    Args:
        error: validation error; ``error.schema`` must contain an 'id' key.
        path: list of path components used to label the message.

    Returns:
        The message string, or None (implicitly) when no case applies.
    """
    # NOTE(review): the nesting below was reconstructed from a copy of the
    # file whose indentation was lost -- confirm against the repository.
    schema_id = error.schema['id']

    if is_service_dict_schema(schema_id) and error.validator == 'additionalProperties':
        return "Invalid service name '{}' - only {} characters are allowed".format(
            # The service_name is the key to the json object
            list(error.instance)[0],
            VALID_NAME_CHARS)

    if schema_id == '#/definitions/constraints':
        # Build context could be in 'build' or 'build.context' and dockerfile
        # could be in 'dockerfile' or 'build.dockerfile'
        context = False
        dockerfile = 'dockerfile' in error.instance
        if 'build' in error.instance:
            if isinstance(error.instance['build'], six.string_types):
                # A plain string 'build' value is itself the build context.
                context = True
            else:
                context = 'context' in error.instance['build']
                dockerfile = dockerfile or 'dockerfile' in error.instance['build']

        # TODO: only applies to v1
        if 'image' in error.instance and context:
            return (
                "{} has both an image and build path specified. "
                "A service can either be built to image or use an existing "
                "image, not both.".format(path_string(path)))

        if 'image' not in error.instance and not context:
            return (
                "{} has neither an image nor a build path specified. "
                "At least one must be provided.".format(path_string(path)))

        # TODO: only applies to v1
        if 'image' in error.instance and dockerfile:
            return (
                "{} has both an image and alternate Dockerfile. "
                "A service can either be built to image or use an existing "
                "image, not both.".format(path_string(path)))

    if error.validator == 'additionalProperties':
        if schema_id == '#/definitions/service':
            invalid_config_key = parse_key_from_error_msg(error)
            return get_unsupported_config_msg(path, invalid_config_key)

        # An empty error path means the unexpected key is at the top level.
        if not error.path:
            return '{}\n{}'.format(error.message, VERSION_EXPLANATION)
  209. def handle_generic_service_error(error, path):
  210. msg_format = None
  211. error_msg = error.message
  212. if error.validator == 'oneOf':
  213. msg_format = "{path} {msg}"
  214. config_key, error_msg = _parse_oneof_validator(error)
  215. if config_key:
  216. path.append(config_key)
  217. elif error.validator == 'type':
  218. msg_format = "{path} contains an invalid type, it should be {msg}"
  219. error_msg = _parse_valid_types_from_validator(error.validator_value)
  220. elif error.validator == 'required':
  221. error_msg = ", ".join(error.validator_value)
  222. msg_format = "{path} is invalid, {msg} is required."
  223. elif error.validator == 'dependencies':
  224. config_key = list(error.validator_value.keys())[0]
  225. required_keys = ",".join(error.validator_value[config_key])
  226. msg_format = "{path} is invalid: {msg}"
  227. path.append(config_key)
  228. error_msg = "when defining '{}' you must set '{}' as well".format(
  229. config_key,
  230. required_keys)
  231. elif error.cause:
  232. error_msg = six.text_type(error.cause)
  233. msg_format = "{path} is invalid: {msg}"
  234. elif error.path:
  235. msg_format = "{path} value {msg}"
  236. if msg_format:
  237. return msg_format.format(path=path_string(path), msg=error_msg)
  238. return error.message
  239. def parse_key_from_error_msg(error):
  240. return error.message.split("'")[1]
  241. def path_string(path):
  242. return ".".join(c for c in path if isinstance(c, six.string_types))
  243. def _parse_valid_types_from_validator(validator):
  244. """A validator value can be either an array of valid types or a string of
  245. a valid type. Parse the valid types and prefix with the correct article.
  246. """
  247. if not isinstance(validator, list):
  248. return anglicize_json_type(validator)
  249. if len(validator) == 1:
  250. return anglicize_json_type(validator[0])
  251. return "{}, or {}".format(
  252. ", ".join([anglicize_json_type(validator[0])] + validator[1:-1]),
  253. anglicize_json_type(validator[-1]))
  254. def _parse_oneof_validator(error):
  255. """oneOf has multiple schemas, so we need to reason about which schema, sub
  256. schema or constraint the validation is failing on.
  257. Inspecting the context value of a ValidationError gives us information about
  258. which sub schema failed and which kind of error it is.
  259. """
  260. types = []
  261. for context in error.context:
  262. if context.validator == 'required':
  263. return (None, context.message)
  264. if context.validator == 'additionalProperties':
  265. invalid_config_key = parse_key_from_error_msg(context)
  266. return (None, "contains unsupported option: '{}'".format(invalid_config_key))
  267. if context.path:
  268. return (
  269. path_string(context.path),
  270. "contains {}, which is an invalid type, it should be {}".format(
  271. json.dumps(context.instance),
  272. _parse_valid_types_from_validator(context.validator_value)),
  273. )
  274. if context.validator == 'uniqueItems':
  275. return (
  276. None,
  277. "contains non unique items, please remove duplicates from {}".format(
  278. context.instance),
  279. )
  280. if context.validator == 'type':
  281. types.append(context.validator_value)
  282. valid_types = _parse_valid_types_from_validator(types)
  283. return (None, "contains an invalid type, it should be {}".format(valid_types))
  284. def process_errors(errors, path_prefix=None):
  285. """jsonschema gives us an error tree full of information to explain what has
  286. gone wrong. Process each error and pull out relevant information and re-write
  287. helpful error messages that are relevant.
  288. """
  289. path_prefix = path_prefix or []
  290. def format_error_message(error):
  291. path = path_prefix + list(error.path)
  292. if 'id' in error.schema:
  293. error_msg = handle_error_for_schema_with_id(error, path)
  294. if error_msg:
  295. return error_msg
  296. return handle_generic_service_error(error, path)
  297. return '\n'.join(format_error_message(error) for error in errors)
  298. def validate_against_fields_schema(config_file):
  299. schema_filename = "fields_schema_v{0}.json".format(config_file.version)
  300. _validate_against_schema(
  301. config_file.config,
  302. schema_filename,
  303. format_checker=["ports", "expose", "bool-value-in-mapping"],
  304. filename=config_file.filename)
  305. def validate_against_service_schema(config, service_name, version):
  306. _validate_against_schema(
  307. config,
  308. "service_schema_v{0}.json".format(version),
  309. format_checker=["ports"],
  310. path_prefix=[service_name])
  311. def _validate_against_schema(
  312. config,
  313. schema_filename,
  314. format_checker=(),
  315. path_prefix=None,
  316. filename=None):
  317. config_source_dir = os.path.dirname(os.path.abspath(__file__))
  318. if sys.platform == "win32":
  319. file_pre_fix = "///"
  320. config_source_dir = config_source_dir.replace('\\', '/')
  321. else:
  322. file_pre_fix = "//"
  323. resolver_full_path = "file:{}{}/".format(file_pre_fix, config_source_dir)
  324. schema_file = os.path.join(config_source_dir, schema_filename)
  325. with open(schema_file, "r") as schema_fh:
  326. schema = json.load(schema_fh)
  327. resolver = RefResolver(resolver_full_path, schema)
  328. validation_output = Draft4Validator(
  329. schema,
  330. resolver=resolver,
  331. format_checker=FormatChecker(format_checker))
  332. errors = [error for error in sorted(validation_output.iter_errors(config), key=str)]
  333. if not errors:
  334. return
  335. error_msg = process_errors(errors, path_prefix=path_prefix)
  336. file_msg = " in file '{}'".format(filename) if filename else ''
  337. raise ConfigurationError("Validation failed{}, reason(s):\n{}".format(
  338. file_msg,
  339. error_msg))