This commit is contained in:
2026-01-08 12:19:44 +08:00
parent fd43e303fa
commit b8fea19fc3
4 changed files with 20 additions and 4 deletions

View File

@@ -1,7 +1,7 @@
[metadata] [metadata]
# replace with your username: # replace with your username:
name = guan name = guan
version = 0.1.196 version = 0.1.198
author = guanjihuan author = guanjihuan
author_email = guanjihuan@163.com author_email = guanjihuan@163.com
description = An open source python package description = An open source python package

View File

@@ -1,6 +1,6 @@
Metadata-Version: 2.4 Metadata-Version: 2.4
Name: guan Name: guan
Version: 0.1.196 Version: 0.1.198
Summary: An open source python package Summary: An open source python package
Home-page: https://py.guanjihuan.com Home-page: https://py.guanjihuan.com
Author: guanjihuan Author: guanjihuan

View File

@@ -471,7 +471,7 @@ def open_file(filename='a', file_format='.txt', mode='add'):
f = open(filename+file_format, 'w', encoding='UTF-8') f = open(filename+file_format, 'w', encoding='UTF-8')
return f return f
# 打印到TXT文件 # 打印到TXT文件(补充内容)
def print_to_file(*args, filename='print_result', file_format='.txt', print_on=True): def print_to_file(*args, filename='print_result', file_format='.txt', print_on=True):
if print_on==True: if print_on==True:
for arg in args: for arg in args:
@@ -483,7 +483,12 @@ def print_to_file(*args, filename='print_result', file_format='.txt', print_on=T
f.write('\n') f.write('\n')
f.close() f.close()
# 读取文本文件内容。如果文件不存在,返回空字符串 # 写入到文本文件(覆盖内容)
def write_text_file(content, filename='a', file_format='.txt'):
    """Write ``content`` to a text file, replacing whatever the file held before.

    The target path is ``filename + file_format``. The file is opened in
    ``'w'`` mode with UTF-8 encoding, so it is created if missing and
    truncated if it already exists.

    Args:
        content: The string to write.
        filename: Path of the file without its extension.
        file_format: Extension appended to ``filename`` (including the dot).

    Returns:
        None.
    """
    target_path = filename + file_format
    # Mode 'w' truncates first: this overwrites rather than appends.
    with open(target_path, 'w', encoding='UTF-8') as handle:
        handle.write(content)
# 读取文本文件内容(如果文件不存在,返回空字符串)
def read_text_file(file_path='./a.txt', make_file=None): def read_text_file(file_path='./a.txt', make_file=None):
import os import os
if not os.path.exists(file_path): if not os.path.exists(file_path):

View File

@@ -28,6 +28,17 @@ def combine_two_pdf_files(input_file_1='a.pdf', input_file_2='b.pdf', output_fil
with open(output_file, 'wb') as combined_file: with open(output_file, 'wb') as combined_file:
output_pdf.write(combined_file) output_pdf.write(combined_file)
# Convert a PDF file to text using pdfplumber
def pdf_to_text_with_pdfplumber(pdf_path):
    """Extract the text of every page of a PDF and join it into one string.

    Args:
        pdf_path: Path of the PDF file, passed straight to ``pdfplumber.open``.

    Returns:
        The text of all pages, in page order, separated by a blank line
        (``"\\n\\n"``). A page with no extractable text contributes an empty
        string, so the number of separators still reflects the page count.
    """
    import pdfplumber
    with pdfplumber.open(pdf_path) as pdf:
        # extract_text() can yield None for a page with no extractable text
        # (older pdfplumber releases); fall back to "" so that str.join does
        # not raise TypeError on such PDFs.
        page_texts = [page.extract_text() or "" for page in pdf.pages]
    return "\n\n".join(page_texts)
# 使用pdfminer3k将PDF文件转成文本 # 使用pdfminer3k将PDF文件转成文本
def pdf_to_text_with_pdfminer3k(pdf_path): def pdf_to_text_with_pdfminer3k(pdf_path):
from pdfminer.pdfparser import PDFParser, PDFDocument from pdfminer.pdfparser import PDFParser, PDFDocument