2021-04-02 18:08:56 +00:00
|
|
|
import ebay_api
|
|
|
|
import numpy as np
|
|
|
|
|
|
|
|
'''
|
|
|
|
Script that calls the CurateData methods from ebay_api.py in sequence to curate training data.
|
|
|
|
'''
|
|
|
|
|
|
|
|
# Single CurateData instance from ebay_api; every step below is a method on it.
curate = ebay_api.CurateData()

# Step 1: obtain the raw data and turn it into the base training set.
# NOTE(review): the source read by import_raw() is defined in ebay_api.py,
# not here -- confirm it is available before running this script.
raw_data = curate.import_raw()
training = curate.to_training(raw_data)

# Step 2: derive two results from the same `training` object. The nvl
# result is additionally passed through drop_nvl_cols().
class_training = curate.class_training(training)
nvl_training = curate.nvl_training(training)
dropd = curate.drop_nvl_cols(nvl_training)

# Step 3: expand both results in one call. Item 0 of the returned value is
# kept as the expanded class data and item 1 as the expanded dropd data.
expanded_dfs = curate.expand_nvlclass(class_training, dropd)
expanded_class, expanded_dropd = expanded_dfs[0], expanded_dfs[1]
|
2021-04-02 18:08:56 +00:00
|
|
|
|
2021-04-03 20:09:21 +00:00
|
|
|
# TODO: replace the PictureURL column values in the expanded dfs with destination URLs
|
2021-04-04 21:38:04 +00:00
|
|
|
# TODO: duplicate listings are still a problem; possibly handle them before running curate
|