123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960 |
- import pandas as pd
- from common.log_utils import logFactory
- from common.database_utils import database_util
- from tqdm import tqdm
# Database client supplied by the project's database_util helper; the
# script below sends every generated INSERT statement through it.
click_client = database_util.get_client()

# Logger for this script, taken from the log factory named "data gen".
_log_factory = logFactory("data gen")
logger = _log_factory.log
# Number of rows covered by each LIMIT window in both sub-selects.
FETCH_SIZE = 1000000

# Number of FETCH_SIZE-row windows of Z_USER_TAG_FLAT_out_202106 that are
# joined against every single window of l_neg_uuid_06.
TAG_WINDOW_COUNT = 74


def build_insert_sql(part, uuid_offset, tag_offset, fetch_size=FETCH_SIZE):
    """Return the INSERT ... SELECT statement for one pair of row windows.

    The statement joins one window of ``l_neg_uuid_06`` (t1) with one window
    of ``Z_USER_TAG_FLAT_out_202106`` (t2) on ``uuid`` and inserts the t2
    columns plus ``I_appuse`` (``length(t2.EVENT_APP_USE.C)``) and ``PART``
    into ``l_neg_origin_06``. The ``order by I_appuse desc limit 1 by
    uuid,EVENT_SPNAME_C`` tail presumably keeps, per (uuid, EVENT_SPNAME_C)
    pair, the row with the largest ``I_appuse`` -- confirm against the
    database's LIMIT BY semantics.

    Args:
        part: Value written to the ``PART`` column.
        uuid_offset: Row offset of the ``l_neg_uuid_06`` window.
        tag_offset: Row offset of the ``Z_USER_TAG_FLAT_out_202106`` window.
        fetch_size: Row count of both windows.

    Returns:
        The SQL text as a single string.
    """
    # NOTE(review): neither sub-select has an ORDER BY, so "limit offset,size"
    # windows may not be stable between statements -- confirm that the windows
    # really partition both tables on the target database.
    return (
        "insert into l_neg_origin_06 "
        f"select t2.*,length(t2.EVENT_APP_USE.C) as I_appuse,{part} as PART "
        f"from (select * from l_neg_uuid_06 limit {uuid_offset},{fetch_size}) t1 "
        "inner join "
        f"(select * from Z_USER_TAG_FLAT_out_202106 limit {tag_offset},{fetch_size}) t2 "
        "on t1.uuid==t2.uuid "
        "order by I_appuse desc limit 1 by uuid,EVENT_SPNAME_C"
    )


def load_parts(parts, tag_windows=TAG_WINDOW_COUNT, fetch_size=FETCH_SIZE):
    """Run the windowed insert for every part number in ``parts``.

    For each part ``p`` the ``l_neg_uuid_06`` window starts at
    ``p * fetch_size``; it is combined with windows ``0 .. tag_windows - 1``
    of ``Z_USER_TAG_FLAT_out_202106``, one statement per combination.

    A failing statement is logged and skipped so that one bad window does not
    abort the rest of the run.

    Args:
        parts: Iterable of integer part numbers (outer loop).
        tag_windows: Number of tag-table windows per part (inner loop).
        fetch_size: Row count of every window.
    """
    for part in tqdm(parts):
        uuid_offset = part * fetch_size
        for window in tqdm(range(tag_windows)):
            sql = build_insert_sql(part, uuid_offset, window * fetch_size, fetch_size)
            # Only the database call can fail here, so only it is guarded.
            try:
                click_client.execute(sql)
            except Exception as e:
                # Best effort: record which outer/inner iteration failed and
                # move on to the next window.
                logger.info(f"第{part}大循环的第{window}小循环出错")
                logger.info(str(e))


if __name__ == "__main__":
    # The script is run in slices of the part range. Slices range(0, 15)
    # ("part1") and range(15, 30) ("part2") used exactly the same statement
    # and were commented out in the previous revision -- presumably because
    # they had already been loaded. This run covers "part3".
    load_parts(range(30, 47))
|