# # Licensed to the Apache Software Foundation (ASF) under one # or more contributor license agreements. See the NOTICE file # distributed with this work for additional information # regarding copyright ownership. The ASF licenses this file # to you under the Apache License, Version 2.0 (the # "License"); you may not use this file except in compliance # with the License. You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, # software distributed under the License is distributed on an # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY # KIND, either express or implied. See the License for the # specific language governing permissions and limitations # under the License. """Setup.py for the Backport packages of Airflow project.""" import io import itertools import json import logging import os import sys import textwrap from importlib import util from os.path import dirname from shutil import copyfile, copytree, rmtree from typing import Dict, List from setuptools import Command, find_packages, setup as setuptools_setup logger = logging.getLogger(__name__) # Kept manually in sync with airflow.__version__ # noinspection PyUnresolvedReferences spec = util.spec_from_file_location("airflow.version", os.path.join('airflow', 'version.py')) # noinspection PyUnresolvedReferences mod = util.module_from_spec(spec) spec.loader.exec_module(mod) # type: ignore version = mod.version # type: ignore PY3 = sys.version_info[0] == 3 # noinspection PyUnboundLocalVariable try: with io.open('README.md', encoding='utf-8') as f: long_description = f.read() except FileNotFoundError: long_description = '' class CleanCommand(Command): """ Command to tidy up the project root. Registered as cmdclass in setup() so it can be called with ``python setup.py extra_clean``. """ description = "Tidy up the project root" user_options = [] # type: List[str] def initialize_options(self): """Set default values for options.""" def finalize_options(self): """Set final values for options.""" # noinspection PyMethodMayBeStatic def run(self): """Run command to remove temporary files and directories.""" os.chdir(dirname(__file__)) os.system('rm -vrf ./build ./dist ./*.pyc ./*.tgz ./*.egg-info') sys.path.append(os.path.join(dirname(__file__), os.pardir)) import setup # From AIRFLOW_SOURCES/setup.py # noqa # isort:skip PROVIDERS_DEPENDENCIES: Dict[str, List[str]] = { "amazon": setup.aws, "apache.cassandra": setup.cassandra, "apache.druid": setup.druid, "apache.hdfs": setup.hdfs, "apache.hive": setup.hive, "apache.livy": [], "apache.pig": [], "apache.pinot": setup.pinot, "apache.spark": [], "apache.sqoop": [], "celery": setup.celery, "cloudant": setup.cloudant, "cncf.kubernetes": setup.kubernetes, "databricks": setup.databricks, "datadog": setup.datadog, "dingding": [], "discord": [], "docker": setup.docker, "email": [], "elasticsearch": [], "ftp": [], "google": setup.gcp, "grpc": setup.grpc, "http": [], "imap": [], "jdbc": setup.jdbc, "jenkins": setup.jenkins, "jira": setup.jira, "microsoft.azure": setup.azure, "microsoft.mssql": setup.mssql, "microsoft.winrm": setup.winrm, "mongo": setup.mongo, "mysql": setup.mysql, "odbc": setup.odbc, "openfaas": [], "opsgenie": [], "oracle": setup.oracle, "pagerduty": setup.pagerduty, "papermill": setup.papermill, "postgres": setup.postgres, "presto": setup.presto, "qubole": setup.qds, "redis": setup.redis, "salesforce": setup.salesforce, "samba": setup.samba, "segment": setup.segment, "sftp": setup.ssh, "slack": setup.slack, "snowflake": setup.snowflake, "sqlite": [], "ssh": setup.ssh, "vertica": setup.vertica, "yandex": [], "zendesk": setup.zendesk, } DEPENDENCIES_JSON_FILE = os.path.join(os.pardir, "airflow", "providers", "dependencies.json") def change_import_paths_to_deprecated(): from bowler import LN, TOKEN, Capture, Filename, Query from fissix.pytree import Leaf def remove_tags_modifier(node: LN, capture: Capture, filename: Filename) -> None: for node in capture['function_arguments'][0].post_order(): if isinstance(node, Leaf) and node.value == "tags" and node.type == TOKEN.NAME: if node.parent.next_sibling and node.parent.next_sibling.value == ",": node.parent.next_sibling.remove() node.parent.remove() def pure_airflow_models_filter(node: LN, capture: Capture, filename: Filename) -> bool: """Check if select is exactly [airflow, . , models]""" return len([ch for ch in node.children[1].leaves()]) == 3 changes = [ ("airflow.operators.bash", "airflow.operators.bash_operator"), ("airflow.operators.python", "airflow.operators.python_operator"), ("airflow.utils.session", "airflow.utils.db"), ] qry = Query() for new, old in changes: qry.select_module(new).rename(old) # Move and refactor imports for Dataflow copyfile( os.path.join(dirname(__file__), os.pardir, "airflow", "utils", "python_virtualenv.py"), os.path.join(dirname(__file__), "airflow", "providers", "google", "cloud", "utils", "python_virtualenv.py" ) ) ( qry .select_module("airflow.utils.python_virtualenv") .rename("airflow.providers.google.cloud.utils.python_virtualenv") ) copyfile( os.path.join(dirname(__file__), os.pardir, "airflow", "utils", "process_utils.py"), os.path.join(dirname(__file__), "airflow", "providers", "google", "cloud", "utils", "process_utils.py" ) ) ( qry .select_module("airflow.utils.process_utils") .rename("airflow.providers.google.cloud.utils.process_utils") ) # Remove tags qry.select_method("DAG").is_call().modify(remove_tags_modifier) # Fix KubernetesPodOperator imports to use old path qry.select_module( "airflow.providers.cncf.kubernetes.operators.kubernetes_pod").rename( "airflow.contrib.operators.kubernetes_pod_operator" ) # Fix BaseOperatorLinks imports files = r"bigquery\.py|mlengine\.py" # noqa qry.select_module("airflow.models").is_filename(include=files).filter(pure_airflow_models_filter).rename( "airflow.models.baseoperator") qry.execute(write=True, silent=False, interactive=False) def copy_provider_sources(): build_dir = os.path.join(dirname(__file__), "build") if os.path.isdir(build_dir): rmtree(build_dir) package_providers_dir = os.path.join(dirname(__file__), "airflow", "providers") if os.path.isdir(package_providers_dir): rmtree(package_providers_dir) copytree(os.path.join(dirname(__file__), os.pardir, "airflow", "providers"), os.path.join(dirname(__file__), "airflow", "providers")) def get_provider_package_name(provider_module: str): return "apache-airflow-providers-" + provider_module.replace(".", "-") def copy_and_refactor_sources(): copy_provider_sources() change_import_paths_to_deprecated() def do_setup_package_providers(provider_module: str, deps: List[str], extras: Dict[str, List[str]]): setup.write_version() provider_package_name = get_provider_package_name(provider_module) package_name = f'{provider_package_name}' if provider_module != "providers" \ else f'apache-airflow-providers' package_prefix = f'airflow.providers.{provider_module}' if provider_module != 'providers' \ else 'airflow.providers' found_packages = find_packages() found_packages = [package for package in found_packages if package.startswith(package_prefix)] setuptools_setup( name=package_name, description=f'Back-porting ${package_name} package for Airflow 1.10.*', long_description=f""" Back-ported {package_name} to 1.10.* series of Airflow. """, long_description_content_type='text/markdown', license='Apache License 2.0', version='0.0.1', packages=found_packages, include_package_data=True, zip_safe=False, install_requires=['apache-airflow~=1.10'] + deps, extras_require=extras, classifiers=[ 'Development Status :: 5 - Production/Stable', 'Environment :: Console', 'Intended Audience :: Developers', 'Intended Audience :: System Administrators', 'License :: OSI Approved :: Apache Software License', 'Programming Language :: Python :: 3.6', 'Programming Language :: Python :: 3.7', 'Topic :: System :: Monitoring', ], python_requires='>=3.6', ) def find_package_dependencies(package: str) -> List[str]: """Finds dependencies for the packages""" if package != 'providers': return PROVIDERS_DEPENDENCIES[package] else: return list(itertools.chain(*PROVIDERS_DEPENDENCIES.values())) def find_package_extras(package: str) -> Dict[str, List[str]]: """Finds extras for the packages""" if package == 'providers': return {} with open(DEPENDENCIES_JSON_FILE, "rt") as dependencies_file: cross_provider_dependencies: Dict[str, List[str]] = json.load(dependencies_file) extras_dict = {module: [get_provider_package_name(module)] for module in cross_provider_dependencies[package]} \ if cross_provider_dependencies.get(package) else {} return extras_dict def get_provider_packages(): """Returns all packages available in providers""" packages = list(PROVIDERS_DEPENDENCIES) return ['providers'] + packages def usage(): print() print("You should provide PACKAGE as first of the setup.py arguments") packages = get_provider_packages() out = "" for package in packages: out += f"{package} " out_array = textwrap.wrap(out, 80) print(f"Available packages: ") print() for text in out_array: print(text) print() print("You can see all packages configured by specifying list-backport-packages as first argument") if __name__ == "__main__": LIST_BACKPORT_PACKAGES = "list-backport-packages" possible_first_params = get_provider_packages() possible_first_params.append(LIST_BACKPORT_PACKAGES) if len(sys.argv) == 1: print() print("ERROR! Missing first param") print() usage() elif sys.argv[1] == "prepare": print("Copying sources and doing refactor") copy_and_refactor_sources() elif sys.argv[1] not in possible_first_params: print() print(f"ERROR! Wrong first param: {sys.argv[1]}") print() usage() elif "--help" in sys.argv or "-h" in sys.argv or \ len(sys.argv) < 2: usage() elif len(sys.argv) > 1 and sys.argv[1] == LIST_BACKPORT_PACKAGES: for key in PROVIDERS_DEPENDENCIES: print(key) else: provider_package = sys.argv[1] if provider_package not in get_provider_packages(): raise Exception(f"The package {provider_package} is not a backport package. " f"Use one of {get_provider_packages()}") del sys.argv[1] print(f"Building backport package: {provider_package}") dependencies = find_package_dependencies(package=provider_package) do_setup_package_providers(provider_module=provider_package, deps=dependencies, extras=find_package_extras(provider_package))