mirror of
https://github.com/ail-project/ail-framework.git
synced 2024-11-30 09:47:17 +00:00
fix: [urlexport importer] fix item name + redis config
This commit is contained in:
parent
b4cb14798c
commit
64fae5d7df
2 changed files with 9 additions and 1 deletion
|
@ -33,11 +33,17 @@ class Ail_feeder_urlextract(Default_json):
|
||||||
# use twitter timestamp ?
|
# use twitter timestamp ?
|
||||||
item_date = datetime.date.today().strftime("%Y/%m/%d")
|
item_date = datetime.date.today().strftime("%Y/%m/%d")
|
||||||
item_id = str(self.json_item['meta']['twitter:url-extracted'])
|
item_id = str(self.json_item['meta']['twitter:url-extracted'])
|
||||||
|
item_id = item_id.split('//')
|
||||||
|
if len(item_id) > 1:
|
||||||
|
item_id = ''.join(item_id[1:])
|
||||||
|
else:
|
||||||
|
item_id = item_id[0]
|
||||||
|
item_id = item_id.replace('/', '_')
|
||||||
if len(item_id) > 215:
|
if len(item_id) > 215:
|
||||||
item_id = '{}{}.gz'.format(item_id[:215], str(uuid.uuid4()))
|
item_id = '{}{}.gz'.format(item_id[:215], str(uuid.uuid4()))
|
||||||
else:
|
else:
|
||||||
item_id = '{}{}.gz'.format(item_id, str(uuid.uuid4()))
|
item_id = '{}{}.gz'.format(item_id, str(uuid.uuid4()))
|
||||||
return os.path.join('urlextract', item_date, item_id) + '.gz'
|
return os.path.join('urlextract', item_date, item_id)
|
||||||
|
|
||||||
# # TODO:
|
# # TODO:
|
||||||
def process_json_meta(self, process, item_id):
|
def process_json_meta(self, process, item_id):
|
||||||
|
|
|
@ -11,6 +11,8 @@ config_loader = ConfigLoader.ConfigLoader()
|
||||||
# get and sanitize PASTE DIRECTORY
|
# get and sanitize PASTE DIRECTORY
|
||||||
PASTES_FOLDER = os.path.join(os.environ['AIL_HOME'], config_loader.get_config_str("Directories", "pastes")) + '/'
|
PASTES_FOLDER = os.path.join(os.environ['AIL_HOME'], config_loader.get_config_str("Directories", "pastes")) + '/'
|
||||||
PASTES_FOLDER = os.path.join(os.path.realpath(PASTES_FOLDER), '')
|
PASTES_FOLDER = os.path.join(os.path.realpath(PASTES_FOLDER), '')
|
||||||
|
|
||||||
|
r_serv_metadata = config_loader.get_redis_conn("ARDB_Metadata")
|
||||||
config_loader = None
|
config_loader = None
|
||||||
|
|
||||||
def exist_item(item_id):
|
def exist_item(item_id):
|
||||||
|
|
Loading…
Reference in a new issue