-
Notifications
You must be signed in to change notification settings - Fork 163
/
setup.py
124 lines (109 loc) · 4.7 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
"""A setuptools for the Data Profiler Application and Python Libraries."""
import os
# To use a consistent encoding
from codecs import open
from os import path
# Always prefer setuptools over distutils
from setuptools import find_packages, setup
# Load package version
from dataprofiler.version import __version__
# Directory containing this setup script; the files read below are resolved
# relative to it.
here = path.abspath(path.dirname(__file__))

# Build the long description from the README file, leaving out every
# <p text-align="left"> ... </p> block (opening and closing lines included).
# Lines inside such a block are skipped while reading, so any number of
# blocks is handled; accumulating the block text and removing it with a
# single str.replace only works when the README contains exactly one block.
with open(path.join(here, "README.md"), encoding="utf-8") as f:
    kept_lines = []
    tag_found = False
    for line in f:
        if '<p text-align="left">' in line:
            tag_found = True
        if not tag_found:
            kept_lines.append(line)
        elif "</p>" in line:
            # The closing line still belongs to the block being dropped;
            # normal copying resumes with the next line.
            tag_found = False
LONG_DESCRIPTION = "".join(kept_lines)
def _read_requirements(filename):
    """Return the lines of ``filename``, located next to this script."""
    with open(path.join(here, filename), encoding="utf-8") as req_file:
        return req_file.read().splitlines()


# Base install requirements, from requirements.txt
required_packages = _read_requirements("requirements.txt")
# Requirements read from requirements-ml.txt
ml_packages = _read_requirements("requirements-ml.txt")
# Requirements read from requirements-reports.txt
reports_packages = _read_requirements("requirements-reports.txt")
resource_dir = "resources"

# One (directory, [paths of the files directly inside it]) pair for every
# directory that os.walk visits under ``resource_dir``.
default_labeler_files = []
for dir_path, _subdirs, file_names in os.walk(resource_dir):
    file_paths = [os.path.join(dir_path, file_name) for file_name in file_names]
    default_labeler_files.append((dir_path, file_paths))
# Short one-line summary, passed to setup() as ``description``.
DESCRIPTION = (
    "What is in your data? "
    "Detect schema, statistics and entities in almost any file."
)
# Trove classifiers for the package. Valid values are listed at
# https://pypi.org/classifiers/
CLASSIFIERS = [
    # Maturity (common values: 3 - Alpha, 4 - Beta, 5 - Production/Stable)
    "Development Status :: 5 - Production/Stable",
    # Intended audience
    "Intended Audience :: Developers",
    "Intended Audience :: Education",
    "Intended Audience :: Information Technology",
    "Intended Audience :: Science/Research",
    "Intended Audience :: System Administrators",
    # Topics
    "Topic :: Education",
    "Topic :: Scientific/Engineering",
    "Topic :: Scientific/Engineering :: Information Analysis",
    "Topic :: Security",
    "Topic :: Software Development :: Build Tools",
    # License (should match the ``license`` argument below)
    "License :: OSI Approved :: Apache Software License",
    # Supported Python versions
    "Programming Language :: Python :: 3",
]

# Optional dependency groups, selected at install time as project[<name>].
EXTRAS_REQUIRE = {
    "ml": ml_packages,
    "reports": reports_packages,
    # "full" combines both optional groups.
    "full": ml_packages + reports_packages,
}

setup(
    # Identity and version
    name="DataProfiler",
    version=__version__,
    python_requires=">=3.9",
    # Descriptions
    description=DESCRIPTION,
    long_description=LONG_DESCRIPTION,
    long_description_content_type="text/markdown",
    # Project metadata
    url="https://github.com/capitalone/data-profiler",
    author="Jeremy Goodsitt, Taylor Turner, Michael Davis, Kenny Bean, Tyler Farnan",
    license="Apache License, Version 2.0",
    classifiers=CLASSIFIERS,
    keywords="Data Investigation",
    # Packages are discovered automatically, skipping the listed names.
    packages=find_packages(exclude=["tests", "examples"]),
    # Run-time dependencies installed by pip together with the project.
    # For "install_requires" vs. requirements files see:
    # https://packaging.python.org/en/latest/requirements.html
    install_requires=required_packages,
    extras_require=EXTRAS_REQUIRE,
    # Additional files collected in ``default_labeler_files``.
    data_files=default_labeler_files,
    include_package_data=True,
)
# Report every package that find_packages() discovers when called without
# exclusions.
discovered_packages = find_packages()
print("find_packages():", discovered_packages)