python 文本处理与tkinter入门

Posted on July 29, 2021 (updated August 1, 2021) · Front End, Python

工作需要，得开发一些带GUI的小工具
在此记录下踩的坑

源码

使用from ... import ...是为了尽量减小打包后文件的大小
文中和Canvas, PhotoImage, ico, bitmap有关的语句也是为了减小打包后exe尺寸而注释掉的。

# import tkinter as tk
# from tkinter import Canvas, Label, StringVar, Entry, Button, Tk, PhotoImage, messagebox
from tkinter import Label, StringVar, Entry, Button, Tk, messagebox

# 窗口居中显示函数
def center_window(root, width, height):
    """Resize *root* to ``width`` x ``height`` and center it on the screen.

    Args:
        root: Tk window; must provide ``winfo_screenwidth``,
            ``winfo_screenheight``, ``geometry`` and ``update``.
        width: Desired window width in pixels.
        height: Desired window height in pixels.
    """
    screen_width = root.winfo_screenwidth()
    screen_height = root.winfo_screenheight()
    # Half of the free space on each axis, truncated to whole pixels.
    offset_x = int((screen_width - width) / 2)
    offset_y = int((screen_height - height) / 2)
    # Geometry string layout: "<width>x<height>+<x offset>+<y offset>".
    root.geometry('%dx%d+%d+%d' % (width, height, offset_x, offset_y))
    # Process pending events so the new geometry is applied right away.
    root.update()

# Create the main window.
window = Tk()
window.title('文本自动划分软件 2.0')
# window.geometry('500x200+1000+500')  # 500 wide, 200 high, 1000 px from the left, 500 px from the top
center_window(window, 280, 200)
# ico_file = r'./TaiJi.ico'  # icon (.ico) file to load
# window.iconbitmap(bitmap=ico_file)  # set the window icon

# Logo (left disabled to keep the packaged exe small):
# canvas = Canvas(window, height=150, width=150)  # create the canvas
# img_file = PhotoImage(file=r'./Tai_Ji_Animation.gif')  # load the image file; GIF only
# img = canvas.create_image(0, 0, anchor='nw', image=img_file)  # draw the image; anchor is given as a compass direction
# canvas.pack(side='top')  # place the canvas

# Static labels around the file-name entry.
Label(window, text='文件名：').place(x=50, y=50)
Label(window, text='(.txt)').place(x=200, y=50)
# The second line is padded with spaces so it lines up under the first.
note = '''说明：待转换文件和该程序
          需在同一文件夹中'''
Label(window, text=note).place(x=50, y=80)

# Variable backing the entry box, pre-filled with a default name.
var_file_name = StringVar()
var_file_name.set('1000')
# Entry box for the input file name (the .txt extension is added by the code).
entry_file_name = Entry(window, textvariable=var_file_name, width=10)
entry_file_name.place(x=100, y=50)

# 文本转换代码（需要放在按钮前，以供按钮调用）
def text_convert():
    """Merge the lines of ``<name>.txt`` into ``##``-joined groups of 30.

    The base file name is read from the ``entry_file_name`` entry box. Each
    run of 30 consecutive lines (the last run may be shorter) becomes one
    record, prefixed with a numbered ``======【第N行】======`` banner, and all
    records are written to ``<name>_30.txt`` in the working directory. A
    message box reports the number of input lines on success, or an error
    when ``<name>.txt`` cannot be found.
    """
    group_size = 30
    name = entry_file_name.get()  # text currently typed into the entry box

    try:
        # NOTE(review): no encoding is passed, so the platform default is
        # used for both files -- confirm this matches the input data.
        with open(r'./' + name + '.txt', 'r') as f:
            # Drop the line break (and any tabs) at both ends of each row.
            data = [row.strip('\n\t') for row in f]

        # Walk the rows in strides of ``group_size`` so every row lands in
        # exactly one group and no empty trailing group is produced.
        groups = ['##'.join(data[start:start + group_size])
                  for start in range(0, len(data), group_size)]

        # Number records by position; looking the text up with list.index()
        # would give identical groups the same number. Each record ends
        # with '\n' so the output uses ordinary line breaks.
        records = ['======【第' + str(number) + '行】======\n' + group + '\n'
                   for number, group in enumerate(groups, start=1)]

        with open(r'./' + name + '_30.txt', 'w') as f:
            f.writelines(records)

        messagebox.showinfo(title='Done', message='转换完成，共转换数据' + str(len(data)) + '条\n结果文件名为' + name + '_30.txt')

    except FileNotFoundError:  # the input file does not exist
        messagebox.showerror(title='Error', message='该文件夹中未找到' + name + '.txt\n')

# Run button: clicking it calls text_convert.
btn_run = Button(window, text='开始转换', command=text_convert)
btn_run.place(x=110, y=120)

# Start the event loop; without this the packaged exe window closes immediately.
window.mainloop()
print('successfully run')

# import tkinter as tk

# from tkinter import Canvas, Label, StringVar, Entry, Button, Tk, PhotoImage, messagebox

from tkinter import Label, StringVar, Entry, Button, Tk, messagebox

# 窗口居中显示函数

def center_window(root, width, height):
    """Resize *root* to ``width`` x ``height`` and center it on the screen.

    Args:
        root: Tk window; must provide ``winfo_screenwidth``,
            ``winfo_screenheight``, ``geometry`` and ``update``.
        width: Desired window width in pixels.
        height: Desired window height in pixels.
    """
    screen_width = root.winfo_screenwidth()
    screen_height = root.winfo_screenheight()
    # Half of the free space on each axis, truncated to whole pixels.
    offset_x = int((screen_width - width) / 2)
    offset_y = int((screen_height - height) / 2)
    # Geometry string layout: "<width>x<height>+<x offset>+<y offset>".
    root.geometry('%dx%d+%d+%d' % (width, height, offset_x, offset_y))
    # Process pending events so the new geometry is applied right away.
    root.update()

# Create the main window.
window = Tk()
window.title('文本自动划分软件 2.0')
# window.geometry('500x200+1000+500')  # 500 wide, 200 high, 1000 px from the left, 500 px from the top
center_window(window, 280, 200)
# ico_file = r'./TaiJi.ico'  # icon (.ico) file to load
# window.iconbitmap(bitmap=ico_file)  # set the window icon

# Logo (left disabled to keep the packaged exe small):
# canvas = Canvas(window, height=150, width=150)  # create the canvas
# img_file = PhotoImage(file=r'./Tai_Ji_Animation.gif')  # load the image file; GIF only
# img = canvas.create_image(0, 0, anchor='nw', image=img_file)  # draw the image; anchor is given as a compass direction
# canvas.pack(side='top')  # place the canvas

# Static labels around the file-name entry.
Label(window, text='文件名：').place(x=50, y=50)
Label(window, text='(.txt)').place(x=200, y=50)
# The second line is padded with spaces so it lines up under the first.
note = '''说明：待转换文件和该程序
          需在同一文件夹中'''
Label(window, text=note).place(x=50, y=80)

# Variable backing the entry box, pre-filled with a default name.
var_file_name = StringVar()
var_file_name.set('1000')
# Entry box for the input file name (the .txt extension is added by the code).
entry_file_name = Entry(window, textvariable=var_file_name, width=10)
entry_file_name.place(x=100, y=50)

# 文本转换代码（需要放在按钮前，以供按钮调用）

def text_convert():
    """Merge the lines of ``<name>.txt`` into ``##``-joined groups of 30.

    The base file name is read from the ``entry_file_name`` entry box. Each
    run of 30 consecutive lines (the last run may be shorter) becomes one
    record, prefixed with a numbered ``======【第N行】======`` banner, and all
    records are written to ``<name>_30.txt`` in the working directory. A
    message box reports the number of input lines on success, or an error
    when ``<name>.txt`` cannot be found.
    """
    group_size = 30
    name = entry_file_name.get()  # text currently typed into the entry box

    try:
        # NOTE(review): no encoding is passed, so the platform default is
        # used for both files -- confirm this matches the input data.
        with open(r'./' + name + '.txt', 'r') as f:
            # Drop the line break (and any tabs) at both ends of each row.
            data = [row.strip('\n\t') for row in f]

        # Walk the rows in strides of ``group_size`` so every row lands in
        # exactly one group and no empty trailing group is produced.
        groups = ['##'.join(data[start:start + group_size])
                  for start in range(0, len(data), group_size)]

        # Number records by position; looking the text up with list.index()
        # would give identical groups the same number. Each record ends
        # with '\n' so the output uses ordinary line breaks.
        records = ['======【第' + str(number) + '行】======\n' + group + '\n'
                   for number, group in enumerate(groups, start=1)]

        with open(r'./' + name + '_30.txt', 'w') as f:
            f.writelines(records)

        messagebox.showinfo(title='Done', message='转换完成，共转换数据' + str(len(data)) + '条\n结果文件名为' + name + '_30.txt')

    except FileNotFoundError:  # the input file does not exist
        messagebox.showerror(title='Error', message='该文件夹中未找到' + name + '.txt\n')

# Run button: clicking it calls text_convert.
btn_run = Button(window, text='开始转换', command=text_convert)
btn_run.place(x=110, y=120)

# Start the event loop; without this the packaged exe window closes immediately.
window.mainloop()
print('successfully run')

参考网站：

感谢知识分享！

二次更新

增加csv对比模块
本来是用xlsx，但是pandas和openpyxl的打包一直无法成功，为此还自己写了CMD脚本
于是想到用csv，恰好python可以不借助其他包读写csv，因此快速试试。
亮点：

多次使用一行代码实现遍历处理，例如lambda函数的使用
利用index返回索引，读取csv中对应位置的信息
try, except的丰富

# y coordinate of the first row of comparison widgets; the second row is 30 px lower.
top_y_2 = 140

# Row 1: base name of the reference ("数据库") .txt file.
Label(window, text='数据库：').place(x=50, y=top_y_2)
Label(window, text='(.txt)').place(x=200, y=top_y_2)
var_ref_name = StringVar()
var_ref_name.set('200')
entry_ref_name = Entry(window, textvariable=var_ref_name, width=10)
entry_ref_name.place(x=100, y=top_y_2)

# Row 2: base name of the .csv file to compare against the reference.
Label(window, text='待对比：').place(x=50, y=top_y_2 + 30)
Label(window, text='(.csv)').place(x=200, y=top_y_2 + 30)
var_ln_name = StringVar()
var_ln_name.set('测试')
entry_ln_name = Entry(window, textvariable=var_ln_name, width=10)
entry_ln_name.place(x=100, y=top_y_2 + 30)

def examine():
    """Flag rows of ``<ln_name>.csv`` whose second column occurs in ``<ref_name>.txt``.

    Both base names are read from the ``entry_ref_name`` / ``entry_ln_name``
    entry boxes. Every line of the reference file is one known value. For
    each CSV row the second comma-separated field (the WeChat-ID column,
    per the original author's note) is looked up among those values; the
    value is appended to the row as an extra column when found, otherwise
    an empty column is appended. The first row is treated as the header and
    receives the column title ``重复项``. The result is written to
    ``<ln_name>_1.csv`` and a summary is shown in a message box.

    A missing input file is reported in a message box. Any other error is
    written, with its traceback, to ``error_log.txt`` and then reported.
    """
    import traceback  # only needed on the unexpected-error path

    ref_name = entry_ref_name.get()
    ln_name = entry_ln_name.get()

    try:
        with open('./' + str(ref_name) + '.txt', 'r', encoding='utf-8') as f:
            refs = [ref.strip('\n') for ref in f]  # one reference value per line

        with open('./' + str(ln_name) + '.csv', 'r', encoding='utf-8') as f:
            lines = [line.strip('\n') for line in f]

        known = set(refs)  # set membership instead of scanning the list per row

        def second_field(line):
            # Text between the first and second comma; rows with no comma
            # (e.g. blank lines) yield '' instead of raising IndexError.
            fields = line.split(',')
            return fields[1] if len(fields) > 1 else ''

        numbers = [second_field(line) for line in lines]
        sames = [number if number in known else '' for number in numbers]
        if sames:
            sames[0] = '重复项'  # header for the added column

        def with_mark(line, mark):
            # Rows that already end in ',' (and blank rows) get the mark
            # appended directly; otherwise insert the missing separator so
            # the mark does not fuse with the last existing field.
            separator = '' if (not line or line.endswith(',')) else ','
            return line + separator + mark + ',\n'

        outs = [with_mark(line, same) for line, same in zip(lines, sames)]
        with open('./' + str(ln_name) + '_1' + '.csv', 'w', encoding='utf-8') as f:
            f.writelines(outs)

        # Count data rows only: the header row is neither screened data nor
        # a duplicate.
        data_rows = sum(1 for line in lines[1:] if line)
        duplicates = sum(1 for same in sames[1:] if same)

        messagebox.showinfo(title='Done', message=
                            '参考给出的' + str(len(refs)) + '条数据\n'
                            + '本次筛选的' + str(data_rows) + '条的数据中\n'
                            + '包含重复数据' + str(duplicates) + '条\n'
                            + '处理结果保存至“' + str(ln_name) + '_1' + '.csv”中')

    except FileNotFoundError:
        messagebox.showerror(title='Error', message='该文件夹中未找到“' + ref_name + '.txt”\n' + '或“' + ln_name + '.csv”')

    except Exception as e:
        # Write the log before telling the user that it has been saved.
        with open('./error_log' + '.txt', 'w', encoding='utf-8') as f:
            f.write(traceback.format_exc())
        messagebox.showerror(title='Error', message='错误类型：“' + str(e) + '”\n错误日志已自动保存至该文件夹“error_log.txt”中\n请联系开发者并发送该报告')

# Run button for the comparison: clicking it calls examine.
btn_run = Button(window, text='开始筛选', command=examine)
btn_run.place(x=110, y=top_y_2 + 60)

# y coordinate of the first row of comparison widgets; the second row is 30 px lower.
top_y_2 = 140

# Row 1: base name of the reference ("数据库") .txt file.
Label(window, text='数据库：').place(y=top_y_2, x=50)
Label(window, text='(.txt)').place(y=top_y_2, x=200)
var_ref_name = StringVar(value='200')
entry_ref_name = Entry(window, width=10, textvariable=var_ref_name)
entry_ref_name.place(y=top_y_2, x=100)

# Row 2: base name of the .csv file to compare against the reference.
Label(window, text='待对比：').place(y=top_y_2 + 30, x=50)
Label(window, text='(.csv)').place(y=top_y_2 + 30, x=200)
var_ln_name = StringVar(value='测试')
entry_ln_name = Entry(window, width=10, textvariable=var_ln_name)
entry_ln_name.place(y=top_y_2 + 30, x=100)

def examine():
    """Flag rows of ``<ln_name>.csv`` whose second column occurs in ``<ref_name>.txt``.

    Both base names are read from the ``entry_ref_name`` / ``entry_ln_name``
    entry boxes. Every line of the reference file is one known value. For
    each CSV row the second comma-separated field (the WeChat-ID column,
    per the original author's note) is looked up among those values; the
    value is appended to the row as an extra column when found, otherwise
    an empty column is appended. The first row is treated as the header and
    receives the column title ``重复项``. The result is written to
    ``<ln_name>_1.csv`` and a summary is shown in a message box.

    A missing input file is reported in a message box. Any other error is
    written, with its traceback, to ``error_log.txt`` and then reported.
    """
    import traceback  # only needed on the unexpected-error path

    ref_name = entry_ref_name.get()
    ln_name = entry_ln_name.get()

    try:
        with open('./' + str(ref_name) + '.txt', 'r', encoding='utf-8') as f:
            refs = [ref.strip('\n') for ref in f]  # one reference value per line

        with open('./' + str(ln_name) + '.csv', 'r', encoding='utf-8') as f:
            lines = [line.strip('\n') for line in f]

        known = set(refs)  # set membership instead of scanning the list per row

        def second_field(line):
            # Text between the first and second comma; rows with no comma
            # (e.g. blank lines) yield '' instead of raising IndexError.
            fields = line.split(',')
            return fields[1] if len(fields) > 1 else ''

        numbers = [second_field(line) for line in lines]
        sames = [number if number in known else '' for number in numbers]
        if sames:
            sames[0] = '重复项'  # header for the added column

        def with_mark(line, mark):
            # Rows that already end in ',' (and blank rows) get the mark
            # appended directly; otherwise insert the missing separator so
            # the mark does not fuse with the last existing field.
            separator = '' if (not line or line.endswith(',')) else ','
            return line + separator + mark + ',\n'

        outs = [with_mark(line, same) for line, same in zip(lines, sames)]
        with open('./' + str(ln_name) + '_1' + '.csv', 'w', encoding='utf-8') as f:
            f.writelines(outs)

        # Count data rows only: the header row is neither screened data nor
        # a duplicate.
        data_rows = sum(1 for line in lines[1:] if line)
        duplicates = sum(1 for same in sames[1:] if same)

        messagebox.showinfo(title='Done', message=
                            '参考给出的' + str(len(refs)) + '条数据\n'
                            + '本次筛选的' + str(data_rows) + '条的数据中\n'
                            + '包含重复数据' + str(duplicates) + '条\n'
                            + '处理结果保存至“' + str(ln_name) + '_1' + '.csv”中')

    except FileNotFoundError:
        messagebox.showerror(title='Error', message='该文件夹中未找到“' + ref_name + '.txt”\n' + '或“' + ln_name + '.csv”')

    except Exception as e:
        # Write the log before telling the user that it has been saved.
        with open('./error_log' + '.txt', 'w', encoding='utf-8') as f:
            f.write(traceback.format_exc())
        messagebox.showerror(title='Error', message='错误类型：“' + str(e) + '”\n错误日志已自动保存至该文件夹“error_log.txt”中\n请联系开发者并发送该报告')

# Run button for the comparison: clicking it calls examine.
btn_run = Button(window, command=examine, text='开始筛选')
btn_run.place(y=top_y_2 + 60, x=110)

写的两个bat批处理文件：

pyinstaller自动安装

call activate text_3.6 D: cd XYX\TMP\XiongXi\0731_Data pyinstaller -F -w TC-4.0.1.py -i hd.ico pause exit

1
2
3
4
5
6

rem Activate the conda environment used for packaging.
call activate text_3.6
rem Switch to drive D: and enter the project folder.
D:
cd XYX\TMP\XiongXi\0731_Data
rem Build TC-4.0.1.py: -F = single-file bundle, -w = no console window, -i = icon file.
pyinstaller -F -w TC-4.0.1.py -i hd.ico
rem Wait for a key press so the build output stays visible, then close.
pause
exit
运行并记录日志

D: cd XYX\TMP\XiongXi\0731_Data\dist TC_2.exe>log.txt 2>&1 pause exit

1
2
3
4
5

rem Switch to drive D: and enter the dist folder of the project.
D:
cd XYX\TMP\XiongXi\0731_Data\dist
rem Run the packaged program, redirecting both stdout and stderr to log.txt.
TC_2.exe>log.txt 2>&1
rem Wait for a key press, then close.
pause
exit
自动创建环境并安装所需库
这里尝试3.6和3.8是因为看到github讨论中说pyinstaller对3.7的支持兼容不好

conda create python=3.6 -n text_3.6 pandas pyinstaller -y conda create python=3.8 -n text_3.8 pandas pyinstaller -y

1
2

rem Create one conda environment per Python version (3.6 and 3.8), each with pandas and pyinstaller; -y skips the confirmation prompt.
rem NOTE(review): if these lines are saved as a .bat file, each presumably needs a leading "call" (as the build script does for "activate"), otherwise the script may stop after the first command - confirm.
conda create python=3.6 -n text_3.6 pandas pyinstaller -y
conda create python=3.8 -n text_3.8 pandas pyinstaller -y

其他

pyinstaller打包图标不变，可能由于explorer.exe有缓存，或是由于ico对应不同尺寸的图标
如果无需担心两个集合内部的顺序，可以用【set】，考虑顺序，还是建议上述方法。

源码

参考网站：

二次更新

其他

Leave a Reply Cancel reply