-
Notifications
You must be signed in to change notification settings - Fork 7
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
12 changed files
with
242 additions
and
20 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,66 @@ | ||
# Checks the project against the Databricks 15.4 LTS dependency set
# (lint, unit tests, test Docker image) and then builds the package,
# publishing it when the push is a tag.
name: Databricks-compatibility
on: [push]

jobs:
  Databricks-compatibility-test:
    runs-on: ubuntu-22.04
    steps:
      - uses: actions/checkout@v4

      - name: Set up Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.11'

      - name: Display Python version
        run: python -c "import sys; print(sys.version)"

      - name: Install dependencies
        run: |
          # Bring the Databricks requirements file next to the sources before installing from it.
          cp -n databricks/requirements-databricks-15.4-LTS.txt .
          python -m pip install --upgrade pip
          pip install flake8 pytest
          if [ -f requirements-databricks-15.4-LTS.txt ]; then pip install -r requirements-databricks-15.4-LTS.txt; fi
      - name: Lint with flake8
        run: |
          # stop the build if there are Python syntax errors or undefined names
          flake8 . --count --select=E9,F63,F7,F82 --show-source --statistics
          # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide
          flake8 . --count --exit-zero --max-complexity=10 --max-line-length=127 --statistics
      - name: Test with pytest
        run: |
          export PYTHONPATH=$PYTHONPATH:${{ github.workspace }}/src
          pytest src/tests
      - name: Build test Docker image
        run: |
          # The Dockerfile is copied to the repository root so that the root is the build context.
          cp -n databricks/databricks.dockerfile .
          docker build -t databricks-test-image -f databricks.dockerfile .
  build-and-publish:
    needs: Databricks-compatibility-test
    runs-on: ubuntu-22.04
    steps:
      - uses: actions/checkout@v4
      - name: Set up Python 3.11
        uses: actions/setup-python@v5
        with:
          python-version: "3.11"
      - name: Install build dependencies
        run: |
          # NOTE(review): "cp -n" never overwrites, so a setup.cfg or pyproject.toml
          # that already exists in the repository root would win over the
          # databricks/ copies - confirm that this is intended.
          cp -n databricks/setup.cfg .
          cp -n databricks/pyproject.toml .
          # Mark the build as the Databricks variant. A plain release number
          # (e.g. 1.2.3) gets "rc1+dbx"; a version that already carries a
          # pre-release/post/dev tag (e.g. 1.2.3rc4) only gets the "+dbx" local
          # label, because a second "rc" segment is not a valid PEP 440 version
          # and would make the build fail.
          if grep -Eq '^[0-9]+(\.[0-9]+)*$' src/syngen/VERSION; then
            sed -i 's/$/rc1+dbx/' src/syngen/VERSION
          else
            sed -i 's/$/+dbx/' src/syngen/VERSION
          fi
          cat src/syngen/VERSION
          python -m pip install --upgrade pip
          pip install build
      - name: Build Package
        run: python -m build .
      # NOTE(review): no repository-url is configured, so the action uploads to
      # its default index - confirm that this is the index PYPI_TEST_TOKEN was
      # issued for. Also verify that the target index accepts versions with a
      # local label ("+dbx"); public indexes are understood to reject them.
      - name: Publish package
        if: github.event_name == 'push' && startsWith(github.ref, 'refs/tags')
        uses: pypa/gh-action-pypi-publish@release/v1
        with:
          password: ${{ secrets.PYPI_TEST_TOKEN }} # For release: use secrets.PYPI_TOKEN
          verbose: true
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
# These files relate to the Databricks-compatible library | ||
|
||
For testing purposes only |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,23 @@ | ||
# syntax=docker/dockerfile:1

# Test image: installs the pinned dependency set on top of the
# Databricks Runtime 15.4 LTS standard image and puts the sources on PYTHONPATH.
FROM databricksruntime/standard:15.4-LTS AS builder

# PIP_INSTALL_CMD is the pip command line that is run from /databricks/python3/bin.
# It is an argument so that a build can point pip at another index, e.g. when a
# syngen release candidate has to be resolved from Test PyPI.
# For local tests, use the following parameter to pass the build argument:
# --build-arg PIP_INSTALL_CMD="pip install --index-url https://test.pypi.org/simple/ --extra-index-url https://pypi.org/simple/ --use-pep517 --no-cache-dir -r requirements-databricks-15.4-LTS.txt"
ARG PIP_INSTALL_CMD="pip install --use-pep517 --no-cache-dir -r requirements-databricks-15.4-LTS.txt"

# Install the compiler toolchain and clean up in the same layer.
# The apt list directory is spelled out explicitly: the default RUN shell is
# "/bin/sh -c", where brace expansion such as /var/lib/{apt,dpkg} is not
# guaranteed, and /var/lib/dpkg must be kept because it is the package database.
RUN apt-get update && \
    apt-get install -y \
        build-essential \
        ccache \
        curl \
        g++ \
        gcc && \
    apt-get autoremove -y && \
    apt-get clean && \
    rm -rf /var/lib/apt/lists/*

# Sources and the pinned dependency list are placed in the image root.
COPY src /src
COPY requirements-databricks-15.4-LTS.txt /requirements-databricks-15.4-LTS.txt

# NOTE(review): the "-r" path in PIP_INSTALL_CMD is relative, so this step
# depends on the build-time working directory being "/" - confirm against the base image.
RUN /databricks/python3/bin/${PIP_INSTALL_CMD}

# Matplotlib is pointed at /tmp for its configuration directory.
ENV MPLCONFIGDIR=/tmp
# Append /src to PYTHONPATH; the ":+" form avoids a leading empty entry
# when the base image does not define PYTHONPATH.
ENV PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}/src"
WORKDIR /src
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,3 @@ | ||
# Build backend declaration: the package is built with setuptools.
[build-system]
build-backend = "setuptools.build_meta"
requires = [
    "setuptools>=68.0.0",
    "wheel",
]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,37 @@ | ||
# Dependency set used for the Databricks 15.4 LTS compatibility build.
# Keep this list in sync with install_requires in the Databricks setup.cfg.
aiohttp>=3.9.0
attrs
avro
base32-crockford
boto3
category_encoders==2.6.3
click
Jinja2
keras==2.15.*
lazy==1.4
loguru
MarkupSafe==2.1.1
marshmallow==3.19.*
matplotlib==3.7.*
mlflow-skinny==2.11.*
numpy==1.23.*
openpyxl
pandas==2.2.*
pandavro==1.8.*
pathos==0.2.*
pillow==9.4.*
psutil
py-ulid
pytest
pytest-reportportal
python-slugify[unidecode]>=7.0.0
PyYAML==6.*
reportportal-client
scikit_learn==1.3.*
scipy==1.11.*
seaborn==0.12.*
setuptools==68.*
tensorflow==2.15.*
tqdm==4.66.3
Werkzeug==3.0.3
xlrd
xlwt
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,82 @@ | ||
# Packaging metadata for the Databricks-compatible build of syngen.
# Only full-line comments are used here; continuation lines of multi-line
# values must stay indented.
[metadata]
name = syngen
version = file: src/syngen/VERSION
description = file: DESCRIPTION
long_description = file: README.md
long_description_content_type = text/markdown
url = https://github.com/tdspora/syngen
author = EPAM Systems, Inc.
maintainer = Pavel Bobyrev
license = GPLv3 License
keywords = data, generation, synthetic, vae, tabular
classifiers =
    Development Status :: 5 - Production/Stable
    Operating System :: POSIX :: Linux
    Operating System :: Microsoft :: Windows
    License :: OSI Approved :: GNU General Public License v3 (GPLv3)
    Programming Language :: Python :: 3.10
    Programming Language :: Python :: 3.11


# The lower bound is inclusive (>=3.10) so that every Python 3.10 release,
# including 3.10.0, is accepted, matching the 3.10 classifier above.
# The install_requires list mirrors the Databricks requirements file.
[options]
package_dir =
    = src
packages = find:
include_package_data = True
python_requires = >=3.10, <3.12
install_requires =
    aiohttp>=3.9.0
    attrs
    avro
    base32-crockford
    boto3
    category_encoders==2.6.3
    click
    Jinja2
    keras==2.15.*
    lazy==1.4
    loguru
    MarkupSafe==2.1.1
    marshmallow==3.19.*
    matplotlib==3.7.*
    mlflow-skinny==2.11.*
    numpy==1.23.*
    openpyxl
    pandas==2.2.*
    pandavro==1.8.*
    pathos==0.2.*
    pillow==9.4.*
    psutil
    py-ulid
    pytest
    pytest-reportportal
    python-slugify[unidecode]>=7.0.0
    PyYAML==6.*
    reportportal-client
    scikit_learn==1.3.*
    scipy==1.11.*
    seaborn==0.12.*
    setuptools==68.*
    tensorflow==2.15.*
    tqdm==4.66.3
    Werkzeug==3.0.3
    xlrd
    xlwt


# Optional dependencies, installed with the "ui" extra.
[options.extras_require]
ui =
    streamlit==1.31.*
    streamlit_option_menu


[options.packages.find]
where = src

# File patterns shipped with every package.
[options.package_data]
* = *.py, *.html, *.ttf, *.svg, *.css, *.js

# Command-line entry points exposed by the package.
[options.entry_points]
console_scripts =
    train = syngen.train:launch_train
    infer = syngen.infer:launch_infer
    syngen = syngen:main
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1 +1 @@ | ||
0.9.46rc10 | ||
0.9.46rc11 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters