asm_to_csv/my_utils.py

104 lines
2.7 KiB
Python
Raw Normal View History

2024-04-15 20:01:20 +08:00
import logging
import os
2024-04-17 15:54:00 +08:00
import json
2024-04-17 10:28:01 +08:00
2024-04-15 20:01:20 +08:00
"""
日志工具
使用方法
logger = setup_logger(日志记录器的实例名字, 日志文件目录)
"""
2024-04-16 20:01:48 +08:00
2024-04-20 18:20:20 +08:00
def setup_logger(name, log_file, level=logging.INFO, reset=False):
    """Return the logger called ``name`` that writes to ``log_file``.

    The function may be called repeatedly with the same arguments; the file
    handler is attached only once, so records are not written multiple times.

    :param name: name passed to ``logging.getLogger``
    :param log_file: path of the log file; missing parent directories are created
    :param level: logging level set on the logger
    :param reset: when true, truncate ``log_file`` before returning
    :return: the configured ``logging.Logger``
    """
    # A bare file name has an empty dirname, and os.makedirs('') raises,
    # so only create the directory when there actually is one.
    log_dir = os.path.dirname(log_file)
    if log_dir:
        os.makedirs(log_dir, exist_ok=True)

    logger = logging.getLogger(name)
    logger.setLevel(level)

    # logging.getLogger returns the same object for the same name, so adding
    # a handler on every call would duplicate each record and leak file handles.
    target = os.path.abspath(log_file)
    already_attached = any(
        isinstance(existing, logging.FileHandler)
        and getattr(existing, 'baseFilename', None) == target
        for existing in logger.handlers
    )
    if not already_attached:
        formatter = logging.Formatter('%(asctime)s %(levelname)s %(message)s')
        handler = logging.FileHandler(log_file)
        handler.setFormatter(formatter)
        logger.addHandler(handler)
        # To echo records to the console as well, attach a StreamHandler here:
        # stream_handler = logging.StreamHandler()
        # stream_handler.setFormatter(formatter)
        # logger.addHandler(stream_handler)

    if reset:
        # Discard the previous contents of the log file.
        with open(log_file, 'w'):
            pass
    return logger
"""
多线程工具
"""
# Default worker counts. os.cpu_count() may return None when the count cannot
# be determined, so fall back to 1; THREAD_HALF is clamped to at least 1
# because a pool size of 0 is rejected by the executors.
THREAD_FULL = os.cpu_count() or 1
THREAD_HALF = max(1, THREAD_FULL // 2)
2024-04-16 20:01:48 +08:00
2024-04-17 15:54:00 +08:00
def multi_thread_order(func, args, thread_num=THREAD_FULL):
    """
    Run ``func`` once per argument on a thread pool and collect the results.

    Results are returned in the same order as ``args``. An argument whose call
    raises is logged to ``./multi_thread.log`` and omitted from the result.

    :param func: callable taking a single argument
    :param args: iterable of arguments, one call to ``func`` per element
    :param thread_num: maximum number of worker threads
    :return: list of return values of the successful calls, in input order
    """
    import concurrent.futures
    from tqdm import tqdm

    # Reuse the logger when it already has a handler so repeated calls do not
    # stack one more file handler (and one more copy of every record) each time.
    logger = logging.getLogger('multi_thread')
    if not logger.handlers:
        logger = setup_logger('multi_thread', './multi_thread.log')

    # Materialise once: the progress bar needs a length and errors are
    # reported by looking the argument up by index.
    args = list(args)
    results_by_index = {}
    with concurrent.futures.ThreadPoolExecutor(max_workers=thread_num) as executor:
        try:
            future_to_index = {
                executor.submit(func, arg): index
                for index, arg in enumerate(args)
            }
            completed = concurrent.futures.as_completed(future_to_index)
            for future in tqdm(completed, total=len(args)):
                index = future_to_index[future]
                try:
                    results_by_index[index] = future.result()
                except Exception as exc:
                    logger.error('%r generated an exception: %s', args[index], exc)
        except Exception:
            # Failure while submitting or iterating; no particular future is
            # involved here, so log the error itself rather than a task argument.
            logger.exception('multi_thread_order aborted before all tasks completed')
    # Futures complete in arbitrary order; restore the submission order.
    return [results_by_index[index] for index in sorted(results_by_index)]
2024-04-16 20:01:48 +08:00
2024-04-20 18:20:20 +08:00
def multi_thread_disorder(func, thread_num=THREAD_FULL, **args):
    """
    Apply ``func`` to every item of ``args`` on a process pool, in no fixed order.

    Despite the name, the work runs in ``multiprocessing.Pool`` worker
    processes. Return values of ``func`` are consumed and discarded; the
    function returns ``None``.

    NOTE(review): ``args`` collects keyword arguments into a dict, and
    iterating a dict yields its keys, so ``func`` receives each keyword
    *name*. Confirm against callers whether that is intended.

    :param func: callable taking a single argument
    :param thread_num: number of worker processes
    :param args: keyword arguments; their names are the items mapped over
    """
    import multiprocessing
    from tqdm import tqdm

    task_count = len(args)
    with multiprocessing.Pool(processes=thread_num) as worker_pool:
        unordered_results = worker_pool.imap_unordered(func, args)
        # Drain the iterator so every task runs and the progress bar advances.
        for _ in tqdm(unordered_results, total=task_count):
            pass
2024-04-16 20:01:48 +08:00
2024-04-17 15:54:00 +08:00
def save_json(filename, data):
    """
    Serialise ``data`` as JSON and write it to ``filename``, replacing the file.

    :param filename: destination path; missing parent directories are created
    :param data: JSON-serialisable object
    :raises TypeError: if ``data`` cannot be serialised by ``json.dumps``
    """
    # Serialise first so an unserialisable object does not truncate the file.
    payload = json.dumps(data)
    # A bare file name has an empty dirname, and os.makedirs('') raises.
    parent_dir = os.path.dirname(filename)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)
    with open(filename, 'w') as file:
        file.write(payload)
2024-04-17 15:54:00 +08:00
2024-04-20 18:20:20 +08:00
def continuation_json(filename, data):
    """
    Serialise ``data`` as JSON and append it to the end of ``filename``.

    The text is appended exactly as produced by ``json.dumps``, with no
    separator between successive writes.

    NOTE(review): a file holding several appended documents is not a single
    JSON value, so ``json.loads`` on the whole file will fail; confirm how
    readers consume it.

    :param filename: destination path; missing parent directories are created
    :param data: JSON-serialisable object
    :raises TypeError: if ``data`` cannot be serialised by ``json.dumps``
    """
    payload = json.dumps(data)
    # Create the parent directory as save_json does; skip an empty dirname
    # because os.makedirs('') raises.
    parent_dir = os.path.dirname(filename)
    if parent_dir:
        os.makedirs(parent_dir, exist_ok=True)
    with open(filename, 'a') as file:
        file.write(payload)
2024-04-17 15:54:00 +08:00
def load_json(filename):
    """
    Read ``filename`` and return its content parsed as JSON.

    :param filename: path of the JSON file to read
    :return: the decoded Python object
    :raises FileNotFoundError: if ``filename`` does not exist
    :raises json.JSONDecodeError: if the file content is not valid JSON
    """
    # The context manager closes the file even when parsing fails.
    with open(filename, 'r') as file:
        return json.load(file)