# 新建文档

In [36]:
from docx import Document
from docx.shared import Inches

# Build a small demo document that exercises the basic python-docx features:
# headings, styled runs, lists, a picture, a table and a page break.
document = Document()

# Add a heading and set its level (range 0 to 9, default 1).
document.add_heading('Document Title', 0)

# Add a paragraph; the text may contain tabs (\t), newlines (\n) or
# carriage returns (\r).
p = document.add_paragraph('          我是谁 ')
# Append further runs to the paragraph; each run can carry its own formatting.
p.add_run('bold').bold = True
p.add_run(' and some ')
p.add_run('italic.').italic = True

document.add_heading('Heading, level 1', level=1)
document.add_paragraph('Intense quote', style='Intense Quote')

# Bulleted list items (rendered with a leading dot).
document.add_paragraph(
    'first item in unordered list', style='List Bullet'
)
document.add_paragraph('second item in unordered list', style='List Bullet')

# Numbered list items.
document.add_paragraph('first item in ordered list', style='List Number')
document.add_paragraph('second item in ordered list', style='List Number')

# Insert a picture; it is read from the current working directory.
document.add_picture('wind_rank.jpg', width=Inches(5))

# Rows for the table below: (quantity, id, description).
records = (
    (3, '101', 'Spam'),
    (7, '422', 'Eggs'),
    (4, '631', 'Spam, spam, eggs, and spam')
)

# Add a table with one row and three columns; data rows are appended below.
# Some of the available table style names:
#   Normal Table
#   Table Grid
#   Light Shading, Light Shading Accent 1 .. Light Shading Accent 6
#   Light List,    Light List Accent 1    .. Light List Accent 6
#   Light Grid,    Light Grid Accent 1    .. Light Grid Accent 6
#   (many more omitted)
table = document.add_table(rows=1, cols=3, style='Light Shading Accent 2')
# Cells of the first row, which serves as the header row.
hdr_cells = table.rows[0].cells
# Fill the three header cells.
hdr_cells[0].text = 'Qty'
hdr_cells[1].text = 'Id'
hdr_cells[2].text = 'Desc'
# The loop variable is called item_id rather than id: at notebook top level a
# loop variable outlives the loop, so `id` would keep shadowing the builtin
# id() in every later cell.
for qty, item_id, desc in records:
    # add_row() appends a row; .cells gives that row's cells.
    row_cells = table.add_row().cells
    row_cells[0].text = str(qty)  # cell text must be a string
    row_cells[1].text = item_id
    row_cells[2].text = desc

document.add_page_break()

# Save the .docx file into the current working directory.
document.save('demo.docx')

In [None]:
#!/usr/bin/python
# coding=UTF-8

from docx import Document
from docx.shared import RGBColor
from docx.enum.text import WD_ALIGN_PARAGRAPH
from docx.shared import  Pt
from docx.oxml import OxmlElement
from docx.oxml.ns import  qn
from docx.shared import Inches
from docx.shared import Cm
# Build an analysis report: title page, an intro section, a sequence of
# screenshots each followed by bold field labels, and two appendix notes.

# Width used for every screenshot (15.24 cm equals 6 inches).
PICTURE_WIDTH = Cm(15.24)

# Screenshot sections in document order: (image path, bold labels that follow it).
REPORT_SECTIONS = (
    ('./image/1.png', (u'MD5:  ', u'TYPE:  ', u'文件名称:  ', u'文件大小:  ')),  # basic info
    ('./image/2.png', (u'判定:  ',)),
    ('./image/3.png', (u'报告2:  ',)),
    ('./image/4.png', (u'分析结果:  ',)),
    ('./image/5.png', (u'检测结果:  ',)),
    ('./image/6.png', (u'关系:  ',)),
    ('./image/7.png', (u'关键字符串:  ',)),
)


def _add_bold_label(doc, text):
    """Append a paragraph containing `text` as a single bold 12 pt run."""
    paragraph = doc.add_paragraph()
    run = paragraph.add_run(text)
    run.bold = True
    run.font.size = Pt(12)
    return paragraph


def _add_note(doc, title, body):
    """Append a green level-3 heading `title` followed by a black 12 pt `body` paragraph."""
    heading = doc.add_heading(level=3)
    run = heading.add_run(title)
    run.font.size = Pt(15)
    run.font.color.rgb = RGBColor(65, 186, 126)
    heading.paragraph_format.line_spacing = Pt(30)

    paragraph = doc.add_paragraph()
    paragraph.paragraph_format.line_spacing = Pt(30)
    run = paragraph.add_run(body)
    run.font.color.rgb = RGBColor(0, 0, 0)
    run.font.size = Pt(12)
    return heading, paragraph


# Create a new, empty document.
document = Document()

# Report title: centered, 36 pt, black.
head = document.add_heading()
head.paragraph_format.alignment = WD_ALIGN_PARAGRAPH.CENTER
head.paragraph_format.space_before = Pt(36)
run = head.add_run(u"生成的报告")
run.font.size = Pt(36)
run.font.color.rgb = RGBColor(0x00, 0x00, 0x00)  # title color
# Western font for the Normal style. This assignment comes first so that the
# rFonts element touched on the next line exists.
document.styles['Normal'].font.name = u'Times New Roman'
# East Asian (Chinese) font for the Normal style.
document.styles['Normal']._element.rPr.rFonts.set(qn('w:eastAsia'), u'宋体')
# Page break after the title.
document.add_page_break()

# Level-2 heading: centered, 21 pt, dark green.
head2 = document.add_heading(level=2)
head2.paragraph_format.alignment = WD_ALIGN_PARAGRAPH.CENTER
run = head2.add_run(u'报告分析')
run.font.size = Pt(21)
run.font.color.rgb = RGBColor(14, 106, 85)
# Space after the heading.
head2.paragraph_format.space_after = Pt(30)

# Body paragraph under the level-2 heading.
p = document.add_paragraph()
run = p.add_run(u'''    段落1
    段落2''')
run.font.color.rgb = RGBColor(0, 0, 0)
run.font.size = Pt(15)
# A Length value sets a fixed line height (30 pt here), not "single" spacing.
p.paragraph_format.line_spacing = Pt(30)
# Space after the paragraph.
p.paragraph_format.space_after = Pt(30)

# Level-3 heading.
head3 = document.add_heading(level=3)
run = head3.add_run(u'分析对象:')
run.font.size = Pt(18)
run.font.color.rgb = RGBColor(0, 0, 0)
# Space after this heading. The original set head2 again here (a copy-paste
# slip), which left head3 without the intended spacing.
head3.paragraph_format.space_after = Pt(30)

# Each screenshot is followed by its bold field labels.
for image_path, labels in REPORT_SECTIONS:
    document.add_picture(image_path, width=PICTURE_WIDTH)
    for label in labels:
        _add_bold_label(document, label)

# Appendix heading.
head4 = document.add_heading(level=3)
run = head4.add_run(u'附件:')
run.font.size = Pt(18)
run.font.color.rgb = RGBColor(0, 0, 0)

# Appendix notes 1 and 2.
_add_note(document, u'注1:', u'''    注解1段落''')
_add_note(document, u'注2:', u'''    注解2段落''')

# Save the file. NOTE: the cell above also writes 'demo.docx', so this
# overwrites that cell's output.
document.save('demo.docx')

# 程序编写一周天气

In [61]:
from docx import Document
from docx.shared import RGBColor
from docx.enum.text import WD_ALIGN_PARAGRAPH
from docx.shared import  Pt
from docx.oxml import OxmlElement
from docx.oxml.ns import  qn
from docx.shared import Inches
from docx.shared import Cm
# Build the weekly weather forecast document: a centered title, a separator
# image, one body paragraph and a second separator image.
document = Document()

# Report title. The heading paragraph is created empty and filled in below.
head = document.add_heading()
# Separator image placed right after the (still empty) heading paragraph.
document.add_picture('line.png', width=Inches(6))
# Debug output: prints the repr of the heading Paragraph object.
print(head)
head.paragraph_format.alignment = WD_ALIGN_PARAGRAPH.CENTER
head.paragraph_format.space_before = Pt(36)
# add_run() takes (text, style). The original passed a stray 0 as the style,
# which is falsy and therefore ignored; a heading level belongs on
# add_heading(), not here.
run = head.add_run(r"一周天气预测")
run.font.size = Pt(36)
run.font.color.rgb = RGBColor(0x00, 0x00, 0x00)  # title color
# Optional: set the Western / East Asian fonts of the Normal style.
# document.styles['Normal'].font.name = u'Times New Roman'
# document.styles['Normal']._element.rPr.rFonts.set(qn('w:eastAsia'), u'宋体')


# Body paragraph (placeholder text).
p = document.add_paragraph()
run = p.add_run(u'''    段落1fsadfasdf asdf asdf asdfsfasdjf klasdfklj发送大量解放拉萨地方就卡死的理发师就ask了就；拉萨扩大飞机拉萨快递费就
发士大夫阿斯蒂芬安抚阿斯蒂芬阿斯顿阿三大色 
    段落2''')
run.font.color.rgb = RGBColor(0, 0, 0)
run.font.size = Pt(15)
# A Length value sets a fixed line height (30 pt here), not "single" spacing.
p.paragraph_format.line_spacing = Pt(30)
# Space after the paragraph.
p.paragraph_format.space_after = Pt(30)
# Closing separator image.
document.add_picture('line.png', width=Inches(6))

# Save into the current working directory (overwrites any existing demo.docx).
document.save('demo.docx')

<docx.text.paragraph.Paragraph object at 0x7f06c845d790>


In [None]:
# 读取一周天气预报

# 将pdf转换成图片


In [62]:
!ls

demo.docx	 info.doc  week.doc	  一周天气预测38期.doc
doc_study.ipynb  line.png  wind_rank.jpg  数据表形式.ipynb


In [64]:
#安装库 pip install pymupdf
import os
import fitz
# Names of the PDF files found in the current working directory.
# Filled by get_file() and read by conver_img().
pdf_dir=[]

def get_file():
	"""Collect the PDF file names of the current working directory into ``pdf_dir``.

	The extension is compared case-insensitively, so ``report.PDF`` is picked
	up as well as ``report.pdf``. Names already present in ``pdf_dir`` are not
	added again, which keeps the list free of duplicates when the function is
	called more than once. Entries are visited in sorted order so the result
	does not depend on the platform's directory listing order.

	Returns:
		The module-level ``pdf_dir`` list (the same object that is mutated).
	"""
	for docuname in sorted(os.listdir()):
		extension = os.path.splitext(docuname)[1]
		if extension.lower()=='.pdf' and docuname not in pdf_dir:
			pdf_dir.append(docuname)
	return pdf_dir
def conver_img():
	"""Render every page of each PDF listed in ``pdf_dir`` to a PNG file.

	For a PDF named ``<name>.pdf`` the pages are written to
	``./tu<name>-NN.png`` where ``NN`` is the zero-based page index padded to
	two digits (the progress message, by contrast, counts pages from 1).
	Progress is reported on stdout. Each document is closed once its pages are
	written, even if rendering fails part-way through.

	NOTE(review): pageCount / preRotate / getPixmap / writePNG are the legacy
	camelCase PyMuPDF names; newer releases appear to expose them only as
	page_count / prerotate / get_pixmap / Pixmap.save -- confirm against the
	installed version before upgrading.
	"""
	# A zoom factor of 2 on each axis gives an image with four times the pixels.
	zoom_x=2.0
	zoom_y=2.0
	rotate = 0 # rotation angle in degrees
	# The transform is identical for every page, so build it once.
	trans = fitz.Matrix(zoom_x, zoom_y).preRotate(rotate)
	for pdf in pdf_dir:
		doc = fitz.open(pdf)
		try:
			pdf_name = os.path.splitext(pdf)[0]
			print("====================================")
			print("开始转换%s.PDF文档"%pdf_name)
			print("====================================")
			page_total = doc.pageCount
			print("共",page_total,"页")
			for pg in range(page_total):
				print("\r转换为图片",pg+1,"/",page_total,end=";")
				page=doc[pg]
				print("")
				pm= page.getPixmap(matrix=trans, alpha=False)
				pm.writePNG(r'./tu'+str(pdf_name)+'-'+'{:02}.png'.format(pg))
		finally:
			# Release the file handle held by the document.
			doc.close()
# Entry point: find the PDFs in the working directory, then render their pages.
if __name__ == "__main__":
	get_file()
	conver_img()

开始转换一周天气预测47期.PDF文档
共 2 页
转换为图片 1 / 2;
转换为图片 2 / 2;
