From 846fa99743eae03d87acd12a3503064398db0e8d Mon Sep 17 00:00:00 2001 From: Steve Nyemba Date: Tue, 30 Mar 2021 17:50:12 -0500 Subject: [PATCH] bug fix: data type and schema fields (order) --- pipeline.py | 3 ++- setup.py | 2 +- 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/pipeline.py b/pipeline.py index d00ddb7..47f8547 100644 --- a/pipeline.py +++ b/pipeline.py @@ -192,6 +192,7 @@ class Components : _columns = None skip_columns = [] _schema = schema + cols = [_item['name'] for _item in _schema] for _df in candidates : # # we need to format the fields here to make sure we have something cohesive @@ -222,7 +223,7 @@ class Components : _df = pd.DataFrame.join(df,_df) - writer.write(_df,schema=_schema,table=args['from']) + writer.write(_df[cols],schema=_schema,table=args['from']) # writer.write(df,table=table) pass else: diff --git a/setup.py b/setup.py index a2e6744..450d0d9 100644 --- a/setup.py +++ b/setup.py @@ -5,7 +5,7 @@ import sys def read(fname): return open(os.path.join(os.path.dirname(__file__), fname)).read() args = {"name":"data-maker", - "version":"1.4.2", + "version":"1.4.3", "author":"Vanderbilt University Medical Center","author_email":"steve.l.nyemba@vanderbilt.edu","license":"MIT", "packages":find_packages(),"keywords":["healthcare","data","transport","protocol"]} args["install_requires"] = ['data-transport@git+https://dev.the-phi.com/git/steve/data-transport.git','tensorflow==1.15','pandas','pandas-gbq','pymongo']