forked from great-expectations/great_expectations
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsetup.py
120 lines (106 loc) · 3.99 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
import re
from pathlib import Path
import pkg_resources
from setuptools import find_packages, setup
import versioneer
def get_extras_require():
results = {}
extra_key_mapping = {
"aws_secrets": "boto",
"azure_secrets": "azure",
"gcp": "bigquery",
"s3": "boto",
}
sqla_keys = (
"athena",
"bigquery",
"dremio",
"mssql",
"mysql",
"postgresql",
"redshift",
"snowflake",
"teradata",
"trino",
"vertica",
)
ignore_keys = (
"sqlalchemy",
"test",
"tools",
"all-contrib-expectations",
)
requirements_dir = "reqs"
rx_name_part = re.compile(r"requirements-dev-(.*).txt")
# Use Path() from pathlib so we can make this section of the code OS agnostic.
# Loop through each requirement file and verify they are named
# correctly and are in the right location.
for file_path in Path().glob(f"{requirements_dir}/*.txt"):
match = rx_name_part.match(file_path.name)
assert (
match is not None
), f"The extras requirements dir ({requirements_dir}) contains files that do not adhere to the following format: requirements-dev-*.txt"
key = match.group(1)
if key in ignore_keys:
continue
with open(file_path) as f:
parsed = [str(req) for req in pkg_resources.parse_requirements(f)]
results[key] = parsed
lite = results.pop("lite")
contrib = results.pop("contrib")
docs_test = results.pop("api-docs-test")
results["boto"] = [req for req in lite if req.startswith("boto")]
results["sqlalchemy"] = [req for req in lite if req.startswith("sqlalchemy")]
results["test"] = lite + contrib + docs_test
for new_key, existing_key in extra_key_mapping.items():
results[new_key] = results[existing_key]
for key in sqla_keys:
results[key] += results["sqlalchemy"]
results.pop("boto")
all_requirements_set = set()
[all_requirements_set.update(vals) for vals in results.values()]
results["dev"] = sorted(all_requirements_set)
return results
# Parse requirements.txt
with open("requirements.txt") as f:
required = f.read().splitlines()
long_description = "Always know what to expect from your data. (See https://github.com/great-expectations/great_expectations for full description)."
config = {
"description": "Always know what to expect from your data.",
"author": "The Great Expectations Team",
"url": "https://greatexpectations.io",
"download_url": "https://github.com/great-expectations/great_expectations",
"author_email": "[email protected]",
"version": versioneer.get_version(),
"cmdclass": versioneer.get_cmdclass(),
"install_requires": required,
"extras_require": get_extras_require(),
"packages": find_packages(
exclude=["contrib*", "docs*", "tests*", "examples*", "scripts*"]
),
"entry_points": {
"console_scripts": ["great_expectations=great_expectations.cli:main"]
},
"package_data": {"great_expectations": ["**/py.typed", "**/*.pyi"]},
"name": "great_expectations",
"long_description": long_description,
"license": "Apache-2.0",
"keywords": "data science testing pipeline data quality dataquality validation datavalidation",
"include_package_data": True,
"classifiers": [
"Development Status :: 4 - Beta",
"Intended Audience :: Developers",
"Intended Audience :: Science/Research",
"Intended Audience :: Other Audience",
"Topic :: Scientific/Engineering",
"Topic :: Software Development",
"Topic :: Software Development :: Testing",
"License :: OSI Approved :: Apache Software License",
"Programming Language :: Python :: 3",
"Programming Language :: Python :: 3.7",
"Programming Language :: Python :: 3.8",
"Programming Language :: Python :: 3.9",
"Programming Language :: Python :: 3.10",
],
}
setup(**config)