16 changed files with 88 additions and 477 deletions
--- a/README.md
+++ b/README.md
@ -18,20 +18,6 @@ Within the virtual environment perform the following :
    pip install git+https://github.com/lnyemba/data-transport.git
 ## Features
    - read/write from over a dozen databases
    - run ETL jobs seamlessly
    - scales and integrates into shared environments like apache zeppelin; jupyterhub; SageMaker; ...
 ## What's new
 Unlike older versions 2.0 and under, we focus on collaborative environments like jupyter-x servers; apache zeppelin:
    1. Simpler syntax to create reader or writer
    2. auth-file registry that can be referenced using a label
    3. duckdb support
 ## Learn More
--- a/info/init.py
+++ b/info/init.py
@ -1,6 +1,6 @@
 __app_name__  = 'data-transport'
 __author__ = 'The Phi Technology'
-__version__= '2.2.6'
+__version__= '2.0.4'
 __email__  = "info@the-phi.com"
 __license__=f"""
 Copyright 2010 - 2024, Steve L. Nyemba
@ -12,10 +12,3 @@ The above copyright notice and this permission notice shall be included in all c
 THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 """
 __whatsnew__=f"""version {__version__}, focuses on collaborative environments like jupyter-base servers (apache zeppelin; jupyter notebook, jupyterlab, jupyterhub)
    1. simpler syntax to create readers/writers
    2. auth-file registry that can be referenced using a label
    3. duckdb support
 """
--- a/notebooks/plugins.ipynb
+++ b/notebooks/plugins.ipynb
@ -1,149 +0,0 @@
 {
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Writing data-transport plugins\n",
    "\n",
    "The data-transport plugins are designed to automate pre/post processing i.e\n",
    "\n",
    "    - Read -> Post processing\n",
    "    - Write-> Pre processing\n",
    "    \n",
    "In this example we will assume, data and write both pre/post processing to any supported infrastructure. We will equally show how to specify the plugins within a configuration file"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "#\n",
    "# Writing to Google Bigquery database\n",
    "#\n",
    "import transport\n",
    "from transport import providers\n",
    "import pandas as pd\n",
    "import os\n",
    "import shutil\n",
    "#\n",
    "#\n",
    "\n",
    "DATABASE = '/home/steve/tmp/demo.db3'\n",
    "if os.path.exists(DATABASE) :\n",
    "    os.remove(DATABASE)\n",
    "#\n",
    "#    \n",
    "_data = pd.DataFrame({\"name\":['James Bond','Steve Rogers','Steve Nyemba'],'age':[55,150,44]})\n",
    "litew = transport.get.writer(provider=providers.SQLITE,database=DATABASE)\n",
    "litew.write(_data,table='friends')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Reading from SQLite\n",
    "\n",
    "The cell below reads the data that has been written by the cell above and computes the average age from a plugin function we will write. \n",
    "\n",
    "- Basic read of the designated table (friends) created above\n",
    "- Read with pipeline functions defined in code\n",
    "\n",
    "**NOTE**\n",
    "\n",
    "It is possible to use **transport.factory.instance** or **transport.instance** or **transport.get.<[reader|writer]>** they are the same. It allows the maintainers to know that we used a factory design pattern."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "           name  age\n",
      "0    James Bond   55\n",
      "1  Steve Rogers  150\n",
      "2  Steve Nyemba   44\n",
      "\n",
      "\n",
      "           name   age  autoinc\n",
      "0    James Bond   5.5        0\n",
      "1  Steve Rogers  15.0        1\n",
      "2  Steve Nyemba   4.4        2\n"
     ]
    }
   ],
   "source": [
    "\n",
    "import transport\n",
    "from transport import providers\n",
    "import os\n",
    "import numpy as np\n",
    "def _autoincrement (_data,**kwargs) :\n",
    "    \"\"\"\n",
    "    This function will add an autoincrement field to the table\n",
    "    \"\"\"\n",
    "    _data['autoinc'] = np.arange(_data.shape[0])\n",
    "    \n",
    "    return _data\n",
    "def reduce(_data,**_args) :\n",
    "    \"\"\"\n",
    "    This function will reduce the age of the data frame\n",
    "    \"\"\"\n",
    "    _data.age /= 10\n",
    "    return _data\n",
    "reader = transport.get.reader(provider=providers.SQLITE,database=DATABASE,table='friends')\n",
    "#\n",
    "# basic read of the data created in the first cell\n",
    "_df = reader.read()\n",
    "print (_df)\n",
    "print ()\n",
    "print()\n",
    "#\n",
    "# read of the data with pipeline function provided to alter the database\n",
    "print (reader.read(pipeline=[_autoincrement,reduce]))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The parameters for instianciating a transport object (reader or writer) can be found at [data-transport home](https://healthcareio.the-phi.com/data-transport)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
 }
--- a/notebooks/s3.ipynb
+++ b/notebooks/s3.ipynb
@ -1,131 +0,0 @@
 {
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Writing to AWS S3\n",
    "\n",
    "We have setup our demo environment with the label **aws** passed to reference our s3 access_key and secret_key and file (called friends.csv). In the cell below we will write the data to our aws s3 bucket named **com.phi.demo**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2.2.1\n"
     ]
    }
   ],
   "source": [
    "#\n",
    "# Writing to mongodb database\n",
    "#\n",
    "import transport\n",
    "from transport import providers\n",
    "import pandas as pd\n",
    "_data = pd.DataFrame({\"name\":['James Bond','Steve Rogers','Steve Nyemba'],'age':[55,150,44]})\n",
    "mgw = transport.get.writer(label='aws')\n",
    "mgw.write(_data)\n",
    "print (transport.__version__)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Reading from AWS S3\n",
    "\n",
    "The cell below reads the data that has been written by the cell above and computes the average age within a mongodb pipeline. The code in the background executes an aggregation using\n",
    "\n",
    "- Basic read of the designated file **friends.csv**\n",
    "- Compute average age using standard pandas functions\n",
    "\n",
    "**NOTE**\n",
    "\n",
    "By design **read** object are separated from **write** objects in order to avoid accidental writes to the database.\n",
    "Read objects are created with **transport.get.reader** whereas write objects are created with **transport.get.writer**"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "          bname  age\n",
      "0    James Bond   55\n",
      "1  Steve Rogers  150\n",
      "2  Steve Nyemba   44\n",
      "--------- STATISTICS ------------\n",
      "83.0\n"
     ]
    }
   ],
   "source": [
    "\n",
    "import transport\n",
    "from transport import providers\n",
    "import pandas as pd\n",
    "\n",
    "def cast(stream) :\n",
    "    print (stream)\n",
    "    return pd.DataFrame(str(stream))\n",
    "mgr = transport.get.reader(label='aws')\n",
    "_df = mgr.read()\n",
    "print (_df)\n",
    "print ('--------- STATISTICS ------------')\n",
    "print (_df.age.mean())"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "An **auth-file** is a file that contains database parameters used to access the database. \n",
    "For code in shared environments, we recommend \n",
    "\n",
    "1. Having the **auth-file** stored on disk \n",
    "2. and the location of the file is set to an environment variable.\n",
    "\n",
    "To generate a template of the **auth-file** open the **file generator wizard** found at visit https://healthcareio.the-phi.com/data-transport"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
 }
--- a/setup.py
+++ b/setup.py
@ -18,8 +18,8 @@ args    = {
    # "packages":["transport","info","transport/sql"]},
    "packages": find_packages(include=['info','transport', 'transport.*'])}
-args["keywords"]=['mongodb','duckdb','couchdb','rabbitmq','file','read','write','s3','sqlite']
+args["keywords"]=['mongodb','couchdb','rabbitmq','file','read','write','s3','sqlite']
-args["install_requires"] = ['pyncclient','duckdb-engine','pymongo','sqlalchemy','pandas','typer','pandas-gbq','numpy','cloudant','pika','nzpy','termcolor','boto3','boto','pyarrow','google-cloud-bigquery','google-cloud-bigquery-storage','flask-session','smart_open','botocore','psycopg2-binary','mysql-connector-python','numpy','pymssql']
+args["install_requires"] = ['pyncclient','pymongo','sqlalchemy','pandas','typer','pandas-gbq','numpy','cloudant','pika','nzpy','boto3','boto','pyarrow','google-cloud-bigquery','google-cloud-bigquery-storage','flask-session','smart_open','botocore','psycopg2-binary','mysql-connector-python','numpy','pymssql']
 args["url"] =   "https://healthcareio.the-phi.com/git/code/transport.git"
 args['scripts'] = ['bin/transport']
 # if sys.version_info[0] == 2 :
--- a/transport/init.py
+++ b/transport/init.py
@ -22,7 +22,7 @@ from transport import sql, nosql, cloud, other
 import pandas as pd
 import json
 import os
-from info import __version__,__author__,__email__,__license__,__app_name__,__whatsnew__
+from info import __version__,__author__,__email__,__license__,__app_name__
 from transport.iowrapper import IWriter, IReader, IETL
 from transport.plugins import PluginLoader
 from transport import providers
@ -38,11 +38,7 @@ def init():
            if _provider_name.startswith('__') or _provider_name == 'common':
                continue
            PROVIDERS[_provider_name] = {'module':getattr(_module,_provider_name),'type':_module.__name__}
-def _getauthfile (path) :
+
    f = open(path)
    _object = json.loads(f.read())
    f.close()
    return _object
 def instance (**_args):
    """
    This function returns an object of to read or write from a supported database provider/vendor
@ -81,15 +77,12 @@ def instance (**_args):
        if not registry.isloaded () :
            if ('path' in _args and registry.exists(_args['path'] )) or registry.exists():
                registry.load() if 'path' not in _args else registry.load(_args['path'])
        _info = {}
        if 'label' in _args and registry.isloaded():
            _info = registry.get(_args['label'])
-        else:
+            
-            _info = registry.get()    
+            if _info :
-        if _info :
+                #
-            #
+                _args = dict(_args,**_info)
            # _args = dict(_args,**_info)
            _args = dict(_info,**_args) #-- we can override the registry parameters with our own arguments
    if 'provider' in _args and _args['provider'] in PROVIDERS :
        _info = PROVIDERS[_args['provider']]
@ -134,7 +127,7 @@ class get :
    """
    @staticmethod
    def reader (**_args):
-        if not _args or ('provider' not in _args and 'label' not in _args):
+        if not _args :
            _args['label'] = 'default'
        _args['context'] = 'read'
        return instance(**_args)
@ -143,7 +136,7 @@ class get :
        """
        This function is a wrapper that will return a writer to a database. It disambiguates the interface
        """
-        if not _args or ('provider' not in _args and 'label' not in _args):
+        if not _args :
            _args['label'] = 'default'
        _args['context'] = 'write'
        return instance(**_args)
--- a/transport/cloud/s3.py
+++ b/transport/cloud/s3.py
@ -3,13 +3,10 @@ Data Transport - 1.0
 Steve L. Nyemba, The Phi Technology LLC
 This file is a wrapper around s3 bucket provided by AWS for reading and writing content
 TODO:
 	- Address limitations that will properly read csv if it is stored with content type text/csv
 """
 from datetime import datetime
-import boto3
+import boto
-# from boto.s3.connection import S3Connection, OrdinaryCallingFormat
+from boto.s3.connection import S3Connection, OrdinaryCallingFormat
 import numpy as np
 import botocore
 from smart_open import smart_open
@ -17,7 +14,6 @@ import sys
 import json
 from io import StringIO
 import pandas as pd
 import json
 class s3 :
@ -33,37 +29,46 @@ class s3 :
 			@param filter		filename or filtering elements
 		"""
 		try:
-			self._client = boto3.client('s3',aws_access_key_id=args['access_key'],aws_secret_access_key=args['secret_key'],region_name=args['region'])
+			self.s3 = S3Connection(args['access_key'],args['secret_key'],calling_format=OrdinaryCallingFormat())			
-			self._bucket_name = args['bucket']	
+			self.bucket = self.s3.get_bucket(args['bucket'].strip(),validate=False) if 'bucket' in args else None
-			self._file_name = args['file']
+			# self.path = args['path']
-			self._region = args['region']
+			self.filter = args['filter'] if 'filter' in args else None
 			self.filename = args['file'] if 'file' in args else None
 			self.bucket_name = args['bucket'] if 'bucket' in args else None
 		except Exception as e :
 			self.s3 = None
 			self.bucket = None
 			print (e)
 			pass
 	def has(self,**_args):
 		_found = None
 		try:
 			if 'file' in _args and 'bucket' in _args:
 				_found = self.meta(**_args)
 			elif 'bucket' in _args and not 'file' in _args:
 				_found =  self._client.list_objects(Bucket=_args['bucket']) 
 			elif 'file' in _args and not 'bucket' in _args :
 				_found = self.meta(bucket=self._bucket_name,file = _args['file'])
 		except Exception as e:
 			_found = None
 			pass
 		return type(_found) == dict
 	def meta(self,**args):
 		"""
 		This function will return information either about the file in a given bucket
 		:name name of the bucket
 		"""
-		_bucket = self._bucket_name if 'bucket' not in args else args['bucket']
+		info = self.list(**args)
-		_file =  self._file_name if 'file' not in args else args['file']
+		[item.open() for item in info]
-		_data = self._client.get_object(Bucket=_bucket,Key=_file)
+		return [{"name":item.name,"size":item.size} for item in info]
-		return _data['ResponseMetadata']
+	def list(self,**args):
-	def close(self):
+		"""
-		self._client.close()	
+		This function will list the content of a bucket, the bucket must be provided by the name
 		:name	name of the bucket
 		"""
 		return list(self.s3.get_bucket(args['name']).list())
 	def buckets(self):
 		#
 		# This function will return all buckets, not sure why but it should be used cautiously 
 		# based on why the s3 infrastructure is used
 		#
 		return [item.name for item in self.s3.get_all_buckets()]
 		# def buckets(self):
 		pass
 		# """
 		# This function is a wrapper around the bucket list of buckets for s3
 		# """
 		# return self.s3.get_all_buckets()
 class Reader(s3) :
 	"""	
@ -72,66 +77,51 @@ class Reader(s3) :
 		- stream content	if file is Not None
 		@TODO: support read from all buckets, think about it
 	"""
-	def __init__(self,**_args) :
+	def __init__(self,**args) :
-			super().__init__(**_args)
+			s3.__init__(self,**args)
-	
+	def files(self):
-	def _stream(self,**_args):
+		r = []
 		"""
 			At this point we should stream a file from a given bucket
 		"""
 		_object = self._client.get_object(Bucket=_args['bucket'],Key=_args['file'])
 		_stream = None
 		try:
-			_stream = _object['Body'].read()
+			return [item.name for item in self.bucket if item.size > 0]
 		except Exception as e:
 			pass
-		if not _stream :
+		return r
-			return None
+	def stream(self,limit=-1):
-		if _object['ContentType'] in ['text/csv'] :
+		"""
-			return pd.read_csv(StringIO(str(_stream).replace("\\n","\n").replace("\\r","").replace("\'","")))
+			At this point we should stream a file from a given bucket
 		"""
 		key = self.bucket.get_key(self.filename.strip())
 		if key is None :
 			yield None
 		else:
-			return _stream
+			count = 0
-		
+			with smart_open(key) as remote_file:
 				for line in remote_file:
 					if count == limit and limit > 0 :
 						break
 				yield line
 				count += 1
 	def read(self,**args) :
-		
+		if self.filename is None :
-		_name = self._file_name if 'file' not in args else args['file']
+			# 
-		_bucket = args['bucket'] if 'bucket' in args else self._bucket_name
+		# returning the list of files because no one file was specified.
-		return self._stream(bucket=_bucket,file=_name)
+			return self.files()
-		
+		else:
 			limit = args['size'] if 'size' in args else -1
 			return self.stream(limit)
 class Writer(s3) :
 	"""
-	"""
+	def __init__(self,**args) :
-	def __init__(self,**_args) :
+		s3.__init__(self,**args)
-		super().__init__(**_args)
+	def mkdir(self,name):
 		#
 		# 
 		if not self.has(bucket=self._bucket_name) :
 			self.make_bucket(self._bucket_name)
 	def make_bucket(self,bucket_name):
 		"""
-		This function will create a folder in a bucket,It is best that the bucket is organized as a namespace
+		This function will create a folder in a bucket
 		:name name of the folder
 		"""
-		
+		self.s3.put_object(Bucket=self.bucket_name,key=(name+'/'))
-		self._client.create_bucket(Bucket=bucket_name,CreateBucketConfiguration={'LocationConstraint': self._region})
+	def write(self,content):
-	def write(self,_data,**_args):
+		file = StringIO(content.decode("utf8"))
-		"""
+		self.s3.upload_fileobj(file,self.bucket_name,self.filename)
 		This function will write the data to the s3 bucket, files can be either csv, or json formatted files
 		"""
 		content = 'text/plain'
 		if type(_data) == pd.DataFrame :
 			_stream = _data.to_csv(index=False)
 			content = 'text/csv'
 		elif type(_data) == dict :
 			_stream = json.dumps(_data)
 			content = 'application/json'
 		else:
 			_stream = _data
 		file = StringIO(_stream)
 		bucket = self._bucket_name if 'bucket' not in _args else _args['bucket']
 		file_name = self._file_name if 'file' not in _args else _args['file']
 		self._client.put_object(Bucket=bucket, Key = file_name, Body=_stream,ContentType=content)
 		pass
--- a/transport/duck.py
+++ b/transport/duck.py
@ -1,19 +0,0 @@
 """
 This file will be intended to handle duckdb database
 """
 import duckdb
 from transport.common import Reader,Writer
 class Duck(Reader):
    def __init__(self,**_args):
        super().__init__(**_args)
        self._path = None if 'path' not in _args else _args['path']
        self._handler = duckdb.connect() if not self._path else duckdb.connect(self._path)
 class DuckReader(Duck) :
    def __init__(self,**_args):
        super().__init__(**_args)
    def read(self,**_args) :
        pass
--- a/transport/iowrapper.py
+++ b/transport/iowrapper.py
@ -52,13 +52,6 @@ class IO:
        if hasattr(self._agent,'apply') :
            return self._agent.apply(_query)
        return None
    def submit(self,_query):
        return self.delegate('submit',_query)
    def delegate(self,_name,_query):
        if hasattr(self._agent,_name) :
            pointer = getattr(self._agent,_name)
            return pointer(_query)
        return None
 class IReader(IO):
    """
    This is a wrapper for read functionalities
--- a/transport/nosql/mongodb.py
+++ b/transport/nosql/mongodb.py
@ -33,8 +33,6 @@ class Mongo :
            :password   password for current user
        """
        self.host = 'localhost' if 'host' not in args else args['host']
        if ':' not in self.host and 'port' in args :
            self.host = ':'.join([self.host,str(args['port'])])
        self.mechanism= 'SCRAM-SHA-256' if 'mechanism' not in args else args['mechanism']
        # authSource=(args['authSource'] if 'authSource' in args else self.dbname)
        self._lock = False if 'lock' not in args else args['lock']
--- a/transport/other/init.py
+++ b/transport/other/init.py
@ -1 +1 @@
-from . import files, http, rabbitmq, callback, files, console
+from . import files, http, rabbitmq, callback, files
--- a/transport/providers/init.py
+++ b/transport/providers/init.py
@ -10,11 +10,8 @@ HTTP='http'
 BIGQUERY	='bigquery'
 FILE 	= 'file'
 ETL = 'etl'
 SQLITE = 'sqlite'
 SQLITE3= 'sqlite3'
 DUCKDB = 'duckdb'
 REDSHIFT = 'redshift'
 NETEZZA = 'netezza'
 MYSQL = 'mysql'
@ -45,6 +42,5 @@ PGSQL	= POSTGRESQL
 AWS_S3  = 's3'
 RABBIT = RABBITMQ
 # QLISTENER = 'qlistener'
--- a/transport/registry.py
+++ b/transport/registry.py
@ -10,11 +10,6 @@ This class manages data from the registry and allows (read only)
 """
 REGISTRY_PATH=os.sep.join([os.environ['HOME'],'.data-transport'])
 #
 # This path can be overriden by an environment variable ...
 #
 if 'DATA_TRANSPORT_REGISTRY_PATH' in os.environ :
    REGISTRY_PATH = os.environ['DATA_TRANSPORT_REGISTRY_PATH']
 REGISTRY_FILE= 'transport-registry.json'
 DATA = {}
@ -42,7 +37,7 @@ def init (email,path=REGISTRY_PATH,override=False):
    Initializing the registry and will raise an exception in the advent of an issue
    """
    p = '@' in email
-    q = False if '.' not in email else email.split('.')[-1] in ['edu','com','io','ai','org']
+    q = False if '.' not in email else email.split('.')[-1] in ['edu','com','io','ai']
    if p and q :
        _config = {"email":email,'version':__version__}
        if not os.path.exists(path):
--- a/transport/sql/init.py
+++ b/transport/sql/init.py
@ -3,7 +3,7 @@ This namespace/package wrap the sql functionalities for a certain data-stores
    - netezza, postgresql, mysql and sqlite
    - mariadb, redshift (also included)
 """
-from . import postgresql, mysql, netezza, sqlite, sqlserver, duckdb
+from . import postgresql, mysql, netezza, sqlite, sqlserver
 #
--- a/transport/sql/common.py
+++ b/transport/sql/common.py
@ -3,8 +3,6 @@ This file encapsulates common operations associated with SQL databases via SQLAl
 """
 import sqlalchemy as sqa
 from sqlalchemy import text 
 import pandas as pd
 class Base:
@ -58,15 +56,7 @@ class Base:
        @TODO: Execution of stored procedures
        """
-        if sql.lower().startswith('select') or sql.lower().startswith('with') :
+        return pd.read_sql(sql,self._engine) if sql.lower().startswith('select') or sql.lower().startswith('with') else None
            return pd.read_sql(sql,self._engine) 
        else:
            _handler = self._engine.connect()
            _handler.execute(text(sql))
            _handler.commit ()
            _handler.close()
        return None
 class SQLBase(Base):
    def __init__(self,**_args):
--- a/transport/sql/duckdb.py
+++ b/transport/sql/duckdb.py
@ -1,24 +0,0 @@
 """
 This module implements the handler for duckdb (in memory or not)
 """
 from transport.sql.common import Base, BaseReader, BaseWriter
 class Duck :
    def __init__(self,**_args):
        #
        # duckdb with none as database will operate as an in-memory database
        #
        self.database = _args['database'] if 'database' in _args else ''
    def get_provider(self):
        return "duckdb"
    def _get_uri(self,**_args):
        return f"""duckdb:///{self.database}"""
 class Reader(Duck,BaseReader) :
    def __init__(self,**_args):
        Duck.__init__(self,**_args)
        BaseReader.__init__(self,**_args)
 class Writer(Duck,BaseWriter):
    def __init__(self,**_args):
        Duck.__init__(self,**_args)
        BaseWriter.__init__(self,**_args)
		`@ -1 +1 @@`
			`from . import files, http, rabbitmq, callback, files, console`				`from . import files, http, rabbitmq, callback, files`