diff --git a/analysis.py b/analysis.py index df616bf..19b4fac 100644 --- a/analysis.py +++ b/analysis.py @@ -9,7 +9,7 @@ from pyspark.ml.feature import PCA from pyspark.ml.linalg import Vectors -from etl import load +from pipe.etl import load def category_distribution(data): """ diff --git a/etl.py b/pipe/etl.py similarity index 100% rename from etl.py rename to pipe/etl.py diff --git a/train.py b/train.py index e91147a..3ef4f49 100644 --- a/train.py +++ b/train.py @@ -14,7 +14,6 @@ import jax import json import numpy as np -from pipe.pipe import SpectrogramPipe import pyspark as spark #from pyspark.ml.feature import OneHotEncoder, StringIndexer from pyspark.sql import SparkSession, functions, types, Row @@ -25,7 +24,7 @@ from sklearn.preprocessing import OneHotEncoder from model.model import TimeSeriesTransformer as TSTF -from etl import load +from pipe.etl import load with open("parameters.json", "r") as file: params = json.load(file)