# coding: utf-8
"""Copy ESTOP test data from raw ``.data`` files into result workbooks.

For every result workbook found in the working directory, the matching raw
data directories (same ``reachXX`` prefix) are scanned, the relevant window of
each tab-separated data file is located, and the velocity / torque / ESTOP
columns are written into the corresponding worksheet.

All user-facing output goes through the ``w2t`` callback supplied by the
caller. Its implementation is not part of this file; every call site uses the
positional form ``w2t(msg[, wait, exitcode, color])``.
"""
from os import scandir
from os.path import basename, dirname, exists, isfile
from sys import argv
from threading import Thread
from time import localtime, sleep, strftime, time

from openpyxl import load_workbook
from pandas import read_csv

# Flag polled by ``w2t_local``: 0 = keep printing progress, 1 = stop.
stop = 0

# Truncated value of pi, kept exactly as before so computed speeds and the
# threshold comparison give the same numbers as earlier runs.
_PI = 3.1415926

_REACHES = ('reach33', 'reach66', 'reach100')
_LOADS = ('load33', 'load66', 'load100')
_SPEEDS = ('speed33', 'speed66', 'speed100')


class GetThreadResult(Thread):
    """Thread that remembers the return value (or exception) of its target."""

    def __init__(self, func, args=()):
        super(GetThreadResult, self).__init__()
        self.func = func
        self.args = args
        self.result = 0
        self.error = None

    def run(self):
        # The one-second delay is inherited from the original implementation.
        sleep(1)
        try:
            self.result = self.func(*self.args)
        except Exception as err:
            # Keep the failure so the thread that waits on us can see it.
            self.error = err

    def get_result(self):
        """Wait for the thread to finish and return what ``func`` returned.

        Raises:
            Exception: whatever ``func`` raised, re-raised in the caller's
                thread instead of being lost inside the worker.
        """
        self.join()
        if self.error is not None:
            raise self.error
        return self.result


def _run_with_progress(func, args, w2t):
    """Run ``func(*args)`` in a worker thread while a ticker prints dots."""
    global stop
    stop = 0
    worker = GetThreadResult(func, args=args)
    ticker = Thread(target=w2t_local, args=('.', 1, w2t))
    worker.start()
    ticker.start()
    try:
        return worker.get_result()
    finally:
        # Always stop the ticker, even when the worker failed, and wait for
        # it to leave its loop before anything else is printed.
        stop = 1
        ticker.join()


def data_process(result_file, raw_data_dirs, av, rr, axis, vel, trq, w2t, estop):
    """Process every raw data directory that belongs to one result workbook.

    Args:
        result_file: path of the result workbook to open, fill and save.
        raw_data_dirs: all raw data directories; only those whose name starts
            with the same ``_``-separated prefix as ``result_file`` are used.
        av, rr, axis, vel, trq, estop: pre-read parameters, passed through
            unchanged to ``single_file_process``.
        w2t: output callback.

    Raises:
        Exception: any error raised while loading or saving the workbook.
    """
    file_name = basename(result_file)
    w2t(f"正在打开文件 {file_name} 需要 1min 左右", 1, 0, 'orange')
    wb_result = _run_with_progress(load_workbook, (result_file, ), w2t)
    w2t('')

    prefix = file_name.split('_')[0]
    for raw_data_dir in raw_data_dirs:
        if basename(raw_data_dir).split('_')[0] != prefix:
            continue
        now_doing_msg(raw_data_dir, 'start', w2t)
        _, data_files = traversal_files(raw_data_dir, w2t)
        # One thread per data file; the 1-based position of the file selects
        # the trailing number of the target sheet name.
        threads = [
            Thread(target=single_file_process,
                   args=(data_file, wb_result, count, av, rr, axis, vel, trq, w2t, estop))
            for count, data_file in enumerate(data_files, start=1)
        ]
        for thread in threads:
            thread.start()
        for thread in threads:
            thread.join()
        now_doing_msg(raw_data_dir, 'done', w2t)

    now_doing_msg(result_file, 'done', w2t)
    w2t(f"正在保存文件 {file_name} 需要 1min 左右", 1, 0, 'orange')
    _run_with_progress(wb_result.save, (result_file, ), w2t)
    w2t('\n')


def check_files(raw_data_dirs, result_files, w2t):
    """Validate the naming and count of result files and raw data directories.

    Every problem found is reported through ``w2t`` with its own error code
    (2 to 6). The function itself returns nothing.
    """
    if len(result_files) != 3:
        msg = "结果文件数目错误,结果文件有且只有三个,请确认!"
        for result_file in result_files:
            w2t(result_file)
        w2t(msg, 0, 2, 'red')

    prefix = [basename(result_file).split('_')[0] for result_file in result_files]
    if sorted(prefix) != sorted(_REACHES):
        # With no result file at all there is no directory to show.
        wd = dirname(result_files[0]) if result_files else ''
        msg = (
            f"请关闭所有相关数据文件,并检查工作目录 {wd} 下,有且只允许有类似如下三个文件: "
            "1. reach33_XXX制动性能测试.xlsx "
            "2. reach66_XXX制动性能测试.xlsx "
            "3. reach100_XX制动性能测试.xlsx"
        )
        w2t(msg, 0, 3, 'red')

    for raw_data_dir in raw_data_dirs:
        components = basename(raw_data_dir).split('_')
        # A name with fewer than three parts is reported as non-compliant
        # instead of failing with an IndexError.
        if (len(components) < 3
                or components[0] not in _REACHES
                or components[1] not in _LOADS
                or components[2] not in _SPEEDS):
            msg = (
                f"报错信息:数据目录 {raw_data_dir} 命名不合规,请参考如下形式: "
                "命名规则:reachAA_loadBB_speedCC "
                "规则解释:AA/BB/CC 指的是臂展/负载/速度的比例,"
                "例如reach66_load100_speed33:66%臂展,100%负载以及33%速度情况下的测试结果文件夹"
            )
            w2t(msg, 0, 4, 'red')

        _, raw_data_files = traversal_files(raw_data_dir, w2t)
        if len(raw_data_files) != 3:
            msg = f"数据目录 {raw_data_dir} 下数据文件个数错误,每个数据目录下有且只能有三个以 .data 为后缀的数据文件"
            w2t(msg, 0, 5, 'red')
        for raw_data_file in raw_data_files:
            if not basename(raw_data_file).endswith('.data'):
                msg = f"数据文件 {raw_data_file} 后缀错误,每个数据目录下有且只能有三个以 .data 为后缀的数据文件"
                w2t(msg, 0, 6, 'red')

    w2t("数据目录合规性检查结束,未发现问题......")


def now_doing_msg(docs, flag, w2t):
    """Print a timestamped start/done message for a file or a directory.

    Args:
        docs: path of the file or directory being processed.
        flag: ``'start'`` or ``'done'``; any other value prints nothing.
        w2t: output callback.
    """
    now = strftime('%Y-%m-%d %H:%M:%S', localtime(time()))
    file_type = 'file' if isfile(docs) else 'dir'
    messages = {
        ('start', 'dir'): f"[{now}] 正在处理目录 {docs} 中的数据......",
        ('start', 'file'): f"[{now}] 正在处理文件 {docs} 中的数据......",
        ('done', 'dir'): f"[{now}] 目录 {docs} 数据文件已处理完毕",
        ('done', 'file'): f"[{now}] 文件 {docs} 数据已处理完毕",
    }
    msg = messages.get((flag, file_type))
    if msg is not None:
        w2t(msg)


def w2t_local(msg, wait, w2t):
    """Print ``msg`` once per second until the global ``stop`` flag is set.

    Returns immediately when ``wait`` is 0.
    """
    while stop == 0 and wait != 0:
        sleep(1)
        w2t(msg, wait, 0, 'orange')


def single_file_process(data_file, wb_result, count, av, rr, axis, vel, trq, w2t, estop):
    """Read one data file and copy its relevant rows into the result workbook.

    The target sheet is derived from the name of the directory that contains
    ``data_file`` and from ``count``.
    """
    df = read_csv(data_file, sep='\t')
    # Sorted alphabetically: ['loadxx', 'reachxx', 'speedxx']
    conditions = sorted(basename(dirname(data_file)).split('_'))
    result_sheet_name = find_result_sheet_name(conditions, count)
    ws_result = wb_result[result_sheet_name]
    row_start, row_end = find_row_start(data_file, df, conditions, av, rr, axis, vel, w2t, estop)
    copy_data_to_result(df, ws_result, row_start, row_end, vel, trq, estop)


def copy_data_to_result(df, ws_result, row_start, row_end, vel, trq, estop):
    """Write the selected rows into columns 1-3 of ``ws_result``.

    Rows ``row_start`` to ``row_end`` (inclusive) of the 1-based columns
    ``vel``, ``trq`` and ``estop`` are written starting at worksheet row 2.
    The rows that follow, up to at least worksheet row 1999, are cleared so
    that values from a previous run do not remain.
    """
    window = df.iloc[row_start:row_end + 1]
    rows = list(zip(window.iloc[:, vel - 1].tolist(),
                    window.iloc[:, trq - 1].tolist(),
                    window.iloc[:, estop - 1].tolist()))
    # Always cover the data plus some padding; the previous formula cut off
    # the last rows when the data had 1999 or 2000 rows.
    row_max = max(2000, len(rows) + 19)
    blank = (None, None, None)
    for offset, _row in enumerate(range(2, row_max)):
        values = rows[offset] if offset < len(rows) else blank
        for column, value in enumerate(values, start=1):
            ws_result.cell(row=_row, column=column).value = value


def find_result_sheet_name(conditions, count):
    """Build the worksheet name for a load/speed combination.

    Args:
        conditions: ``['loadxx', 'reachxx', 'speedxx']``.
        count: number appended to the sheet name.

    Returns:
        A name such as ``33%负载_33%速度_1``.
    """
    load = conditions[0].removeprefix('load')
    speed = conditions[2].removeprefix('speed')
    return f"{load}%负载_{speed}%速度_{count}"


def find_row_start(data_file, df, conditions, av, rr, axis, vel, w2t, estop):
    """Locate the window of rows to copy from one data file.

    The start is 20 rows before the last row whose ESTOP column is non-zero
    (clamped to row 0). The end is 100 rows after the first following row
    whose converted speed is below 1 (clamped to the last row).

    Returns:
        ``(row_start, row_end)``.

    Raises:
        ValueError: if no row has a non-zero ESTOP value, or if the speed
            never drops below 1 after ``row_start``. The same message is sent
            to ``w2t`` first.
    """
    ratio = float(conditions[2].removeprefix('speed')) / 100
    av_max = av * ratio
    row_max = df.index[-1]
    threshold = 0.95

    row_start = None
    for _row in range(row_max, -1, -1):
        if df.iloc[_row, estop - 1] != 0:
            row_start = max(_row - 20, 0)
            break
    if row_start is None:
        msg = f"数据文件 {data_file} 采集的数据中没有 ESTOP 为非 0 的情况,需要确认"
        w2t(msg, 0, 9, 'red')
        # Stop here with a clear error; continuing would fail on an
        # undefined row_start.
        raise ValueError(msg)

    row_end = None
    for _row in range(row_start, row_max):
        # NOTE(review): presumably converts rad/s to rpm scaled by rr - confirm.
        speed_row = (df.iloc[_row, vel - 1] * 180) / _PI * rr * 60 / 360
        if abs(speed_row) < 1:
            row_end = min(_row + 100, row_max)
            break
    if row_end is None:
        msg = f"数据文件 {data_file} 最后的速度未降为零 "
        w2t(msg, 0, 10, 'red')
        raise ValueError(msg)

    # Clamp the lower bound: a negative start would count from the end of the
    # frame, giving an empty window and silently skipping the check below.
    window_start = max(row_start - 10, 0)
    av_estop = abs((df.iloc[window_start:row_start + 10, vel - 1].abs().mean() * 180) / _PI)
    if abs(av_estop / av_max) < threshold:
        filename = basename(data_file)
        w2t(f"[av_estop: {av_estop:.2f} | shouldbe: {av_max:.2f}] 数据文件 {filename} 触发 ESTOP 时未采集到指定百分比的最大速度,需要检查", 0, 0, '#8A2BE2')

    return row_start, row_end


def traversal_files(path, w2t):
    """List the direct children of ``path``, without descending further.

    Returns:
        ``(dirs, files)``: two lists of paths.

    Raises:
        FileNotFoundError: if ``path`` does not exist. The message is sent to
            ``w2t`` first.
    """
    if not exists(path):
        msg = f'数据文件夹{path}不存在,请确认后重试......'
        w2t(msg, 0, 1, 'red')
        raise FileNotFoundError(msg)

    dirs = []
    files = []
    for item in scandir(path):
        if item.is_dir():
            dirs.append(item.path)
        elif item.is_file():
            files.append(item.path)
    return dirs, files


def main(path, av, rr, axis, vel, trq, estop, w2t):
    """Check the working directory, process every result file, report timing.

    Args:
        path: working directory that holds the result files and the raw data
            directories.
        av, rr, axis, vel, trq, estop: parameters passed through unchanged to
            ``data_process``.
        w2t: output callback.
    """
    time_start = time()
    raw_data_dirs, result_files = traversal_files(path, w2t)

    try:
        check_files(raw_data_dirs, result_files, w2t)
        prefixes = {basename(raw_data_dir).split("_")[0] for raw_data_dir in raw_data_dirs}
        for result_file in result_files:
            # Skip result files that have no raw data directory.
            if basename(result_file).split('_')[0] not in prefixes:
                continue
            now_doing_msg(result_file, 'start', w2t)
            data_process(result_file, raw_data_dirs, av, rr, axis, vel, trq, w2t, estop)
    except Exception as err:
        msg = f"出现错误:{err}\n程序运行错误,请检查配置文件是否准确设定,以及数据文件组织是否正确,也有可能是结果文件损坏,尝试重新复制一份,再运行!"
        w2t(msg, 0, 11, 'red')

    w2t("----------------------------------------------------------")
    w2t("全部处理完毕")
    time_end = time()
    time_total = time_end - time_start
    msg = f"数据处理时间:{time_total // 3600:02.0f} h {time_total % 3600 // 60:02.0f} m {time_total % 60:02.0f} s"
    w2t(msg)


def _console_w2t(msg, wait=0, exitcode=0, color=None):
    """Print ``msg`` to stdout; used only when the file is run as a script.

    NOTE(review): the real callback is provided by the caller of ``main`` and
    is not visible here. The parameter names are inferred from the call sites
    (message, stay-on-the-same-line flag, error code, colour) - confirm
    against the real implementation. The error code and colour are ignored.
    """
    print(msg, end='' if wait else '\n', flush=True)


if __name__ == "__main__":
    # Command-line arguments arrive as strings: convert the numeric ones and
    # use a console writer, because a string cannot serve as the callback.
    main(path=argv[1], av=float(argv[2]), rr=float(argv[3]), axis=int(argv[4]),
         vel=int(argv[5]), trq=int(argv[6]), estop=int(argv[7]), w2t=_console_w2t)