project.py 2.8 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485
  1. import os
  2. from six.moves import cPickle as pickle
  3. import warnings
  4. from importlib import import_module
  5. from os.path import join, dirname, abspath, isabs, exists
  6. from scrapy.utils.conf import closest_scrapy_cfg, get_config, init_env
  7. from scrapy.settings import Settings
  8. from scrapy.exceptions import NotConfigured
  9. from scrapy.exceptions import ScrapyDeprecationWarning
  10. ENVVAR = 'SCRAPY_SETTINGS_MODULE'
  11. DATADIR_CFG_SECTION = 'datadir'
  12. def inside_project():
  13. scrapy_module = os.environ.get('SCRAPY_SETTINGS_MODULE')
  14. if scrapy_module is not None:
  15. try:
  16. import_module(scrapy_module)
  17. except ImportError as exc:
  18. warnings.warn("Cannot import scrapy settings module %s: %s" % (scrapy_module, exc))
  19. else:
  20. return True
  21. return bool(closest_scrapy_cfg())
  22. def project_data_dir(project='default'):
  23. """Return the current project data dir, creating it if it doesn't exist"""
  24. if not inside_project():
  25. raise NotConfigured("Not inside a project")
  26. cfg = get_config()
  27. if cfg.has_option(DATADIR_CFG_SECTION, project):
  28. d = cfg.get(DATADIR_CFG_SECTION, project)
  29. else:
  30. scrapy_cfg = closest_scrapy_cfg()
  31. if not scrapy_cfg:
  32. raise NotConfigured("Unable to find scrapy.cfg file to infer project data dir")
  33. d = abspath(join(dirname(scrapy_cfg), '.scrapy'))
  34. if not exists(d):
  35. os.makedirs(d)
  36. return d
  37. def data_path(path, createdir=False):
  38. """
  39. Return the given path joined with the .scrapy data directory.
  40. If given an absolute path, return it unmodified.
  41. """
  42. if not isabs(path):
  43. if inside_project():
  44. path = join(project_data_dir(), path)
  45. else:
  46. path = join('.scrapy', path)
  47. if createdir and not exists(path):
  48. os.makedirs(path)
  49. return path
  50. def get_project_settings():
  51. if ENVVAR not in os.environ:
  52. project = os.environ.get('SCRAPY_PROJECT', 'default')
  53. init_env(project)
  54. settings = Settings()
  55. settings_module_path = os.environ.get(ENVVAR)
  56. if settings_module_path:
  57. settings.setmodule(settings_module_path, priority='project')
  58. # XXX: remove this hack
  59. pickled_settings = os.environ.get("SCRAPY_PICKLED_SETTINGS_TO_OVERRIDE")
  60. if pickled_settings:
  61. warnings.warn("Use of environment variable "
  62. "'SCRAPY_PICKLED_SETTINGS_TO_OVERRIDE' "
  63. "is deprecated.", ScrapyDeprecationWarning)
  64. settings.setdict(pickle.loads(pickled_settings), priority='project')
  65. # XXX: deprecate and remove this functionality
  66. env_overrides = {k[7:]: v for k, v in os.environ.items() if
  67. k.startswith('SCRAPY_')}
  68. if env_overrides:
  69. settings.setdict(env_overrides, priority='project')
  70. return settings