Skip to content

Commit 6d094b0

Browse files
little polish
1 parent a14a2fd commit 6d094b0

File tree

9 files changed

+968
-8
lines changed

9 files changed

+968
-8
lines changed

Pipfile

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -8,6 +8,7 @@ loguru = "==0.6.*"
88
pandas = "==1.5.*"
99
scikit-learn = "*"
1010
tqdm = "*"
11+
jupyter = "*"
1112

1213
[dev-packages]
1314
black = "==23.*"

Pipfile.lock

Lines changed: 944 additions & 1 deletion
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
# lazy-learn
1+
![lazy-learn logo](doc/logo/transparent.png)
22
0.0.1
33

44
---

doc/logo/grayscale_transparent.png

58.1 KB
Loading

doc/logo/original.png

61.2 KB
Loading

doc/logo/transparent.png

65 KB
Loading

python/src/lazylearn/ingestion/ingestion_pipeline_steps/interpreter_step.py

Lines changed: 12 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,4 @@
1+
import pandas as pd
12
from pandas import Series
23
from pipeline.pipeline import IngestionPipeline
34
from tqdm import tqdm
@@ -12,6 +13,7 @@ def apply(self, pipeline: IngestionPipeline):
1213
:param pipeline: parent IngestionPipeline
1314
:return:
1415
"""
16+
self.df = pipeline.df
1517
columns = pipeline.df.columns
1618
column_types = {}
1719

@@ -37,7 +39,10 @@ def analyze_column(self, column: Series):
3739
elif self.numeric_test(types):
3840
return "numeric"
3941

40-
return "object"
42+
elif self.datetime_check(column):
43+
return "datetime"
44+
else:
45+
return "object"
4146

4247
@staticmethod
4348
def categorical_test(values: list):
@@ -73,6 +78,9 @@ def numeric_test(types: list):
7378
def string_test(types: set):
7479
raise NotImplementedError
7580

76-
@staticmethod
77-
def date_check(types: set):
78-
raise NotImplementedError
81+
def datetime_check(self, column: Series):
82+
try:
83+
self.df[column.name] = pd.to_datetime(column)
84+
return True
85+
except:
86+
return False

python/src/lazylearn/models/models.py

Lines changed: 9 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,15 @@
1+
from pandas import DataFrame
2+
3+
14
class Dataset:
2-
def __init__(self):
5+
def __init__(self, df: DataFrame, column_type_map: dict):
36
self.name = None
47
self.description = None
8+
self.df = df
9+
self.column_type_map = column_type_map
10+
11+
def save(self):
12+
raise NotImplementedError
513

614

715
class Model:

python/src/lazylearn/pipeline/pipeline.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -31,4 +31,4 @@ def __init__(self):
3131
self.summary_stats: dict = {}
3232

3333
def response(self):
34-
return Dataset
34+
return Dataset(df=self.df, column_type_map=self.column_type_map)

0 commit comments

Comments
 (0)