forked from capitalone/DataProfiler
-
Notifications
You must be signed in to change notification settings - Fork 0
/
setup.py
113 lines (99 loc) · 4.36 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
"""A setuptools for the Data Profiler Application and Python Libraries."""
import os
# To use a consistent encoding
from codecs import open
from os import path
# Always prefer setuptools over distutils
from setuptools import find_packages, setup
# Load package version
from dataprofiler.version import __version__
here = path.abspath(path.dirname(__file__))
# Get the long description from the README file
with open(path.join(here, "README.md"), encoding="utf-8") as f:
LONG_DESCRIPTION = f.read()
# Get the install_requirements from requirements.txt
with open(path.join(here, "requirements.txt"), encoding="utf-8") as f:
required_packages = f.read().splitlines()
# Get the install_requirements from requirements-ml.txt
with open(path.join(here, "requirements-ml.txt"), encoding="utf-8") as f:
ml_packages = f.read().splitlines()
# Get the install_requirements from requirements-reports.txt
with open(path.join(here, "requirements-reports.txt"), encoding="utf-8") as f:
reports_packages = f.read().splitlines()
resource_dir = "resources/"
default_labeler_files = [
(d, [os.path.join(d, f) for f in files]) for d, _, files in os.walk(resource_dir)
]
DESCRIPTION = (
"What is in your data? Detect schema, statistics and entities in almost any file."
)
setup(
name="DataProfiler",
version=__version__,
python_requires=">=3.7",
description=DESCRIPTION,
long_description=LONG_DESCRIPTION,
long_description_content_type="text/markdown",
# The project's main homepage.
url="https://github.com/capitalone/data-profiler",
# Author details
author="Jeremy Goodsitt, Taylor Turner, Michael Davis, Kenny Bean, Tyler Farnan",
# Choose your license
license="Apache License, Version 2.0",
# See https://pypi.python.org/pypi?%3Aaction=list_classifiers
classifiers=[
# How mature is this project? Common values are
# 3 - Alpha
# 4 - Beta
# 5 - Production/Stable
"Development Status :: 5 - Production/Stable",
# Indicate who your project is intended for
"Intended Audience :: Developers",
"Intended Audience :: Education",
"Intended Audience :: Information Technology",
"Intended Audience :: Science/Research",
"Intended Audience :: System Administrators",
"Topic :: Education",
"Topic :: Scientific/Engineering",
"Topic :: Scientific/Engineering :: Information Analysis",
"Topic :: Security",
"Topic :: Software Development :: Build Tools",
# Pick your license as you wish (should match "license" above)
"License :: OSI Approved :: Apache Software License",
# Specify the Python versions you support here. In particular, ensure
# that you indicate whether you support Python 3 or both.
"Programming Language :: Python :: 3",
],
# What does your project relate to?
keywords="Data Investigation",
# You can just specify the packages manually here if your project is
# simple. Or you can use find_packages().
# packages=find_packages(exclude=['src/test', 'src/sample']),
packages=find_packages(exclude=["tests", "examples"]),
# List run-time dependencies here. These will be installed by pip when
# your project is installed. For an analysis of "install_requires" vs pip's
# requirements files see:
# https://packaging.python.org/en/latest/requirements.html
install_requires=required_packages,
# List of run-time dependencies for the labeler. These will be installed
# by pip when someone installs the project[<label>].
extras_require={
"ml": ml_packages,
"reports": reports_packages,
"full": ml_packages + reports_packages,
},
# # If there are data files included in your packages that need to be
# # installed, specify them here. If using Python 2.6 or less, then these
# # have to be included in MANIFEST.in as well.
# package_data={
# 'data': [],
# },
#
# # Although 'package_data' is the preferred approach, in some case you may
# # need to place data files outside of your packages. See:
# # http://docs.python.org/3.4/distutils/setupscript.html#installing-additional-files # noqa
# # In this case, 'data_file' will be installed into '<sys.prefix>/my_data'
data_files=default_labeler_files,
include_package_data=True,
)
print("find_packages():", find_packages())