You cannot select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
data-maker/pipeline.py

698 lines
22 KiB
Python

#!/usr/bin/env python3
5 years ago
class KEYS :
logger.write({"module":"bigquery","action":"read","input":{"sql":SQL}})
if 'autopilot' in ( list(args.keys())) :
else:
if df[name].unique().size > 0 :
4 years ago
if 'gpu' in args :
4 years ago
_approx = {}
4 years ago
# writer.write(_df[cols],schema=_schema,table=args['from'])
# if 'file' in args :
# DATA = np.array_split(DATA,PART_SIZE)
# job.start()
# jobs.append(job)
# # if len(jobs) == 1 :
# # job.join()
# Let us create n-jobs across n-gpus, The assumption here is the data that is produced will be a partition
# jobs.append(job)