Browse Source

append

main
Julin 2 years ago
parent
commit
1132ef28c0
  1. 11
      code/pep-stats-report/Dockerfile
  2. 50
      code/pep-stats-report/app/db_helper.py
  3. 110
      code/pep-stats-report/app/image_helper.py
  4. 2
      code/pep-stats-report/config.ini
  5. 78
      code/pep-stats-report/main.py
  6. 2
      code/pep-stats-report/requirements.txt

11
code/pep-stats-report/Dockerfile

@ -5,7 +5,7 @@ WORKDIR /app
COPY . . COPY . .
RUN pip install --upgrade pip -i http://mirrors.aliyun.com/pypi/simple/ --trusted-host mirrors.aliyun.com && \ RUN pip install --upgrade pip -i http://mirrors.aliyun.com/pypi/simple/ --trusted-host mirrors.aliyun.com && \
pip install -r requirements.txt -i http://mirrors.aliyun.com/pypi/simple/ --trusted-host mirrors.aliyun.com && \ pip install -r requirements_linux.txt -i http://mirrors.aliyun.com/pypi/simple/ --trusted-host mirrors.aliyun.com && \
cp SimHei.ttf /usr/local/lib/python3.8/site-packages/matplotlib/mpl-data/fonts/ttf && \ cp SimHei.ttf /usr/local/lib/python3.8/site-packages/matplotlib/mpl-data/fonts/ttf && \
pyinstaller -F main.py --distpath=. pyinstaller -F main.py --distpath=.
@ -13,6 +13,13 @@ FROM debian:11-slim
WORKDIR /app WORKDIR /app
COPY --from=python_base /app/main /app/config.ini ./ COPY --from=python_base /app/main /app/config.ini /app/SimHei.ttf ./
RUN cp -a /etc/apt/sources.list /etc/apt/sources.list.bak && \
sed -i "s@http://deb.debian.org@http://mirrors.aliyun.com@g" /etc/apt/sources.list && \
sed -i "s@http://security.debian.org@http://mirrors.aliyun.com@g" /etc/apt/sources.list
RUN apt-get update && apt-get install libreoffice -y && \
cp SimHei.ttf /usr/share/fonts/
CMD ["./main"] CMD ["./main"]

50
code/pep-stats-report/app/db_helper.py

@ -1,5 +1,5 @@
def querystring_user_procinst_duration(start, end, except_senior, department): def querystring_user_procinst_duration(start, end, except_senior, department):
filter_user = "and u.name not in ('刘文峰', '金亮', '姜珍', '余莎莎', '张阳根', '唐国华', '刘国勇', '刘会连', '肖琥')" if except_senior else "" filter_user = "and u.name not in ('刘文峰', '金亮', '姜珍', '余莎莎', '张阳根', '唐国华', '刘国勇', '刘会连', '肖琥', '邱峰')" if except_senior else ""
filter_department = "and department_name='{}'".format(department) if department else "" filter_department = "and department_name='{}'".format(department) if department else ""
return ''' return '''
select department_name, select department_name,
@ -34,9 +34,6 @@ group by department_name, user_name, procinst_id
def querystring_senior_procinst_duration(start, end): def querystring_senior_procinst_duration(start, end):
return ''' return '''
SELECT user_name,
ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user
from (
select user_name, select user_name,
procinst_id, procinst_id,
sum(duration_in_minutes) as procinst_duration_in_minutes sum(duration_in_minutes) as procinst_duration_in_minutes
@ -56,11 +53,9 @@ from (
inner join workflow_process as wp on wpv.process_id=wp.id inner join workflow_process as wp on wpv.process_id=wp.id
inner join user as u on wpa.deal_user_id=u.id inner join user as u on wpa.deal_user_id=u.id
where wpa.end_time >='{}' and wpa.end_time < '{}' and wp.deleted=false and wp.is_enable=true and u.delete=0 and u.state=1 and u.active_status=1 where wpa.end_time >='{}' and wpa.end_time < '{}' and wp.deleted=false and wp.is_enable=true and u.delete=0 and u.state=1 and u.active_status=1
and u.name in ('刘文峰', '金亮', '姜珍', '余莎莎', '张阳根', '唐国华', '刘国勇', '刘会连', '肖琥') and u.name in ('刘文峰', '金亮', '姜珍', '余莎莎', '张阳根', '唐国华', '刘国勇', '刘会连', '肖琥', '邱峰')
) as r ) as r
group by user_name, procinst_id group by user_name, procinst_id
) as r2
GROUP by r2.user_name
'''.format(start, end) '''.format(start, end)
@ -139,14 +134,22 @@ order by procinst_duration_in_hours_by_department DESC
def querystring_procinst_duration_by_senior(start, end): def querystring_procinst_duration_by_senior(start, end):
return ''' return '''
SELECT ROUND(AVG(procinst_duration_in_hours_by_user), 2) as procinst_duration_in_hours_by_department SELECT ROUND(AVG(procinst_duration_in_hours_by_user), 2) as procinst_duration_in_hours_by_department
from ({}) as r3 from (
SELECT user_name,
ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user
from ({}) as r2
GROUP by r2.user_name
) as r3
'''.format(querystring_senior_procinst_duration(start, end)) '''.format(querystring_senior_procinst_duration(start, end))
# 用户单流程处理耗时(高管) # 用户单流程处理耗时(高管)
def querystring_procinst_duration_by_user_senior(start, end): def querystring_procinst_duration_by_user_senior(start, end):
return ''' return '''
{} SELECT user_name,
ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user
from ({}) as r2
GROUP by r2.user_name
order by procinst_duration_in_hours_by_user DESC order by procinst_duration_in_hours_by_user DESC
'''.format(querystring_senior_procinst_duration(start, end)) '''.format(querystring_senior_procinst_duration(start, end))
@ -154,7 +157,12 @@ order by procinst_duration_in_hours_by_user DESC
# 各部门耗时较长用户(高管) # 各部门耗时较长用户(高管)
def querystring_user_gt_senior_avg(start, end, avg): def querystring_user_gt_senior_avg(start, end, avg):
return ''' return '''
SELECT * from ({}) as r3 SELECT * from (
SELECT user_name,
ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user
from ({}) as r2
GROUP by r2.user_name
) as r3
WHERE r3.procinst_duration_in_hours_by_user > {} WHERE r3.procinst_duration_in_hours_by_user > {}
order by procinst_duration_in_hours_by_user DESC order by procinst_duration_in_hours_by_user DESC
'''.format(querystring_senior_procinst_duration(start, end), avg) '''.format(querystring_senior_procinst_duration(start, end), avg)
@ -178,8 +186,28 @@ order by procinst_duration_in_hours_by_user desc
def querystring_procinst_duration_by_user(start, end, department): def querystring_procinst_duration_by_user(start, end, department):
return """ return """
SELECT user_name, SELECT user_name,
ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user ROUND(AVG(procinst_duration_in_minutes) /60, 2) as procinst_duration_in_hours_by_user
from ({}) as r2 from ({}) as r2
group by r2.user_name group by r2.user_name
order by procinst_duration_in_hours_by_user DESC order by procinst_duration_in_hours_by_user DESC
""".format(querystring_user_procinst_duration(start, end, True, department)) """.format(querystring_user_procinst_duration(start, end, True, department))
# 按部门统计用户处理流程数量
def querystring_procinst_count_by_user(start, end, department):
return '''
SELECT user_name,
COUNT(*) as procinst_count_by_user
from ({}) as r2
group by r2.user_name
'''.format(querystring_user_procinst_duration(start, end, True, department))
# 用户处理流程数量(高管)
def querystring_procinst_count_by_senior(start, end):
return '''
SELECT user_name,
COUNT(*) as procinst_count_by_user
from ({}) as r2
group by r2.user_name
'''.format(querystring_senior_procinst_duration(start, end))

110
code/pep-stats-report/app/image_helper.py

@ -0,0 +1,110 @@
import platform
import os
import fitz # pip install PyMuPDF
from PIL import Image
import shutil
import logging
# 将word文件转换成pdf文件
def word2pdf(word_file):
from win32com import client # pip install pywin32
# 获取word格式处理对象
word = client.Dispatch('Word.Application')
# 以Doc对象打开文件
doc_ = word.Documents.Open(word_file)
# 另存为pdf文件
pdf_file = word_file.replace(os.path.basename(word_file).split('.')[1], "pdf")
doc_.SaveAs(pdf_file, FileFormat=17)
logging.info(f'{word_file} ----转pdf成功')
# 关闭doc对象
doc_.Close()
# 退出word对象
word.Quit()
return pdf_file
# 将word文件转换成pdf文件(Linux)
def word2pdf_linux(word_file):
word_path = os.path.dirname(word_file)
os.system(f"libreoffice --headless --language=zh-CN --convert-to pdf {word_file} --outdir {word_path}")
logging.info(f'{word_file} ----转pdf成功')
pdf_file = word_file.replace(os.path.basename(word_file).split('.')[1], "pdf")
return pdf_file
# pdf转图片
def pdf2png(pdf_file):
image_path = os.path.abspath(f'{os.path.dirname(pdf_file)}/tmp_pdf2png')
try:
# 创建一个空白图片,用于拼接内容
width, height = 0, 0
images = []
pdf_doc = fitz.open(pdf_file)
for pg in range(pdf_doc.page_count):
page = pdf_doc[pg]
rotate = int(0)
# 每个尺寸的缩放系数为1.3,这将为我们生成分辨率提高2.6的图像。
# 此处若是不做设置,默认图片大小为:792X612, dpi=96
zoom_x = 1.33333333 # (1.33333333-->1056x816) (2-->1584x1224)
zoom_y = 1.33333333
mat = fitz.Matrix(zoom_x, zoom_y).prerotate(rotate)
pix = page.get_pixmap(matrix=mat, alpha=False)
if not os.path.exists(image_path): # 判断存放图片的文件夹是否存在
os.makedirs(image_path) # 若图片文件夹不存在就创建
pix.save(image_path + '/' + 'tmp%s.png' % pg) # 将图片写入指定的文件夹内
img = Image.open(image_path + '/' + 'tmp%s.png' % pg)
img_width, img_height = img.size
# 更新拼接图片的宽度和高度
width = max(width, img_width)
height += img_height
# 添加图片到拼接列表
images.append(img)
# 创建一个空白长图
long_image = Image.new('RGB', (width, height), (255, 255, 255))
y_offset = 0
# 将每张图片拼接到长图中
for img in images:
long_image.paste(img, (0, y_offset))
y_offset += img.height
# 保存拼接后的长图
png_file = pdf_file.replace(os.path.basename(pdf_file).split('.')[1], "png")
long_image.save(png_file)
# 删除中间临时保存的图片
shutil.rmtree(image_path)
except IOError as error:
logging.error('pdf转png失败')
raise error
else:
logging.info("pdf转png成功")
return png_file
def word_to_long_image(word_file_path):
try:
_file = os.path.abspath(word_file_path) # os.path.abspath('input.docx')
if platform.system().lower() == 'windows':
pdf_file = word2pdf(_file)
else:
pdf_file = word2pdf_linux(_file)
png_file = pdf2png(pdf_file)
# 删除中间保存的pdf文件
os.remove(pdf_file)
return png_file
except Exception as error:
logging.error('word转长图出错:{}'.format(error))
raise error

2
code/pep-stats-report/config.ini

@ -3,7 +3,7 @@ host = 10.8.30.161
port = 30900 port = 30900
username = default username = default
password = password =
database = pepca_m database = pepca9
[qiniu] [qiniu]
access-key=5XrM4wEB9YU6RQwT64sPzzE6cYFKZgssdP5Kj3uu access-key=5XrM4wEB9YU6RQwT64sPzzE6cYFKZgssdP5Kj3uu

78
code/pep-stats-report/main.py

@ -7,7 +7,8 @@ from docx.shared import Inches, Pt, RGBColor
from docx.enum.text import WD_PARAGRAPH_ALIGNMENT, WD_LINE_SPACING from docx.enum.text import WD_PARAGRAPH_ALIGNMENT, WD_LINE_SPACING
from docx.oxml.ns import qn from docx.oxml.ns import qn
import matplotlib.pyplot as plt import matplotlib.pyplot as plt
from app import db_helper import numpy as np
from app import db_helper, image_helper
import qiniu import qiniu
import logging import logging
@ -107,6 +108,43 @@ def create_bar_chart(doc, x, y, mean, title, filename):
r.add_picture('{}/{}'.format(REPORT_DIR, filename), width=Inches(6)) r.add_picture('{}/{}'.format(REPORT_DIR, filename), width=Inches(6))
def create_bar_twinx_chart(doc, x, y1, y2, mean, title, filename):
plt.rcParams["font.sans-serif"] = ["SimHei"] # 设置字体
plt.rcParams["axes.unicode_minus"] = False # 正常显示负号
x_range = np.arange(len(x))
width = 0.25 # the width of the bars
fig, ax1 = plt.subplots()
ax1.set_ylabel('耗时')
rects = ax1.bar(x_range, y1, width, color=(31 / 255, 168 / 255, 201 / 255), label='耗时')
ax1.bar_label(rects, padding=3)
ax1.set_xticks(x_range + width / 2, x)
# 设置x轴标签旋转角度
plt.xticks(rotation=-30, ha='left')
# 绘制均值线
plt.axhline(mean, linestyle='dashed', color='#FF8C00', label=f'均值:{mean}')
ax2 = ax1.twinx() # instantiate a second axes that shares the same x-axis
ax2.set_ylabel('流程数')
rects = ax2.bar(x_range + width, y2, width, color='#5AC189', label='流程数')
ax2.bar_label(rects, padding=3)
plt.title(title)
fig.legend(loc='upper right', ncols=1, bbox_to_anchor=(1, 1), bbox_transform=ax1.transAxes)
fig.tight_layout() # otherwise the right y-label is slightly clipped
# 保存图形
plt.savefig('{}/{}'.format(REPORT_DIR, filename))
plt.close()
# 插入图形到 Word 文档中
p = doc.add_paragraph()
p.alignment = WD_PARAGRAPH_ALIGNMENT.CENTER
r = p.add_run()
r.add_picture('{}/{}'.format(REPORT_DIR, filename), width=Inches(6))
def add_section(doc, rank, department, d_elapse): def add_section(doc, rank, department, d_elapse):
h = doc.add_heading(level=2) h = doc.add_heading(level=2)
r = h.add_run('{}. {}'.format(rank, department)) r = h.add_run('{}. {}'.format(rank, department))
@ -124,6 +162,12 @@ def add_section(doc, rank, department, d_elapse):
) if department == '高管' else db_helper.querystring_procinst_duration_by_user( ) if department == '高管' else db_helper.querystring_procinst_duration_by_user(
start_time, end_time, department) start_time, end_time, department)
procinst_duration_by_user = client.execute(qs) procinst_duration_by_user = client.execute(qs)
qs = db_helper.querystring_procinst_count_by_senior(
start_time, end_time
) if department == '高管' else db_helper.querystring_procinst_count_by_user(
start_time, end_time, department)
procinst_count_by_user = client.execute(qs)
except Exception as error: except Exception as error:
print('数据库查询错误:', error) print('数据库查询错误:', error)
logging.error('数据库查询错误:{}'.format(error)) logging.error('数据库查询错误:{}'.format(error))
@ -149,11 +193,20 @@ def add_section(doc, rank, department, d_elapse):
set_paragraph_format(p) set_paragraph_format(p)
x = [] x = []
y = [] y1 = []
y2 = []
for user, elapse in procinst_duration_by_user: for user, elapse in procinst_duration_by_user:
x.append(user) x.append(user)
y.append(elapse) y1.append(elapse)
create_bar_chart(doc, x, y, d_elapse, "个人流程处理平均耗时", "{}-流程处理平均耗时.png".format(department))
for name in x:
for user, count in procinst_count_by_user:
if user == name:
y2.append(count)
break
create_bar_twinx_chart(doc, x, y1, y2, d_elapse, "个人流程处理平均耗时", "{}-流程处理平均耗时.png".format(department))
caption = doc.add_paragraph('图 2-{} {}个人处理流程平均耗时'.format(rank, department)) caption = doc.add_paragraph('图 2-{} {}个人处理流程平均耗时'.format(rank, department))
caption.alignment = WD_PARAGRAPH_ALIGNMENT.CENTER caption.alignment = WD_PARAGRAPH_ALIGNMENT.CENTER
@ -193,7 +246,7 @@ def add_chapter_1(doc):
logging.error('数据库查询错误:{}'.format(error)) logging.error('数据库查询错误:{}'.format(error))
raise RuntimeError('数据库查询错误:', error) raise RuntimeError('数据库查询错误:', error)
if procinst_duration_by_senior > procinst_duration_by_company: if procinst_duration_by_senior is not None and procinst_duration_by_senior > procinst_duration_by_company:
department_count_gt_avg += 1 department_count_gt_avg += 1
p = doc.add_paragraph() p = doc.add_paragraph()
@ -289,12 +342,17 @@ def generate_word_report():
set_paragraph_format(p_last) set_paragraph_format(p_last)
# 保存文档 # 保存文档
report_path = '{}/项企流程效能分析结果公示(全员)-{}{}月.docx'.format(REPORT_DIR, last_year, last_month) report_file_name = '项企流程效能分析结果公示(全员)-{}{}月.docx'.format(last_year, last_month)
doc.save(report_path) report_file = f'{REPORT_DIR}/{report_file_name}'
logging.info('本地报表创建成功:{}'.format(report_path)) doc.save(report_file)
logging.info('本地报表创建成功:{}'.format(report_file))
# 将文档转换为图片
png_file = image_helper.word_to_long_image(report_file)
# 上传七牛云 # 上传七牛云
upload_to_qiniu('项企流程效能分析结果公示(全员)-{}{}月.docx'.format(last_year, last_month)) upload_to_qiniu(report_file_name)
upload_to_qiniu(os.path.basename(png_file))
def create_clickhouse_client(): def create_clickhouse_client():
@ -343,7 +401,7 @@ if __name__ == '__main__':
procinst_duration_by_senior = client.execute(qs3)[0][0] procinst_duration_by_senior = client.execute(qs3)[0][0]
for index, (department, elapse) in enumerate(procinst_duration_by_department): for index, (department, elapse) in enumerate(procinst_duration_by_department):
if procinst_duration_by_senior >= elapse: if procinst_duration_by_senior is not None and procinst_duration_by_senior >= elapse:
procinst_duration_by_department.insert(index, ('高管', procinst_duration_by_senior)) procinst_duration_by_department.insert(index, ('高管', procinst_duration_by_senior))
break break

2
code/pep-stats-report/requirements.txt

@ -19,11 +19,13 @@ pefile==2023.2.7
Pillow==9.5.0 Pillow==9.5.0
pyinstaller==5.10.1 pyinstaller==5.10.1
pyinstaller-hooks-contrib==2023.2 pyinstaller-hooks-contrib==2023.2
PyMuPDF==1.22.3
pyparsing==3.0.9 pyparsing==3.0.9
python-dateutil==2.8.2 python-dateutil==2.8.2
python-docx==0.8.11 python-docx==0.8.11
pytz==2023.3 pytz==2023.3
pytz-deprecation-shim==0.1.0.post0 pytz-deprecation-shim==0.1.0.post0
pywin32==306
pywin32-ctypes==0.2.0 pywin32-ctypes==0.2.0
qiniu==7.10.0 qiniu==7.10.0
requests==2.28.2 requests==2.28.2

Loading…
Cancel
Save