一、xlrd和xlwt模块介绍
xlrd模块提供在任何平台上从excel电子表格(.xls和.xlsx)中提取数据的功能,xlwt模块提供生成与Microsoft Excel 95 到2003版本兼容的excel文件的功能。
1、安装方法
# 方法一:
pip3 install xlrd
pip3 install xlwt # 方法二:
在python官网http://pypi.python.org/pypi/xlrd/(xlwt)下载xlrd/xlwt的安装包。
压缩包放置在python安装目录下python/Lib/site-packages。
解压压缩包:tar zxvf xlrd-1.0.0.tar.gz
进入到解压的文件夹:cd xlrd-1.0.0
执行命令:python setup,py install
2、xlrd使用详解
(1)excel文档准备
准备excel文档:联系人.xls,内容如下所示:
(2)xlrd获取sheet工作表名称和对象
import xlrd # 打开Excel文件读取器,加上utf-8编码可防止遇到中文字符乱码
data = xlrd.open_workbook('联系人.xls', encoding_override='utf-8') # 获取所有sheet工作表名称
sheetnames = data.sheet_names()
print(sheetnames)
"""
['银行1', '银行2']
"""
# 通过索引获取指定sheet工作表名称
sheet_name = data.sheet_names()[1]
print(sheet_name)
"""
银行2
"""
# 通过工作表名称获取sheet对象
table_name = data.sheet_by_name(sheet_name)
print(table_name)
"""
<xlrd.sheet.Sheet object at 0x10b657160>
"""
# 通过sheet索引获取sheet工作表对象
table_index = data.sheet_by_index(0)
print(table_index)
"""
<xlrd.sheet.Sheet object at 0x1073b3f28>
"""
(3)sheet工作表行/列操作
# 获取行数和列数
nrows = table_name.nrows # 总行数
ncols = table_name.ncols # 总列数
print("银行2表,总行数: %s,总列数: %s" % (nrows, ncols))
"""
银行2表,总行数: 5,总列数: 7
"""
# 根据sheet对象获取整行和整列的值
sheet_row_val = table_name.row_values(3)
sheet_col_val = table_name.col_values(3)
print("整行的值:%s , \n整列的值: %s" % (sheet_row_val, sheet_col_val))
"""
整行的值:['', '李九', '开发', 'IOS开发', 87888.0, 13213123.0, 'wang1@164.com'] ,
整列的值: ['', '工作职责', 'UI设计', 'IOS开发', '硬件维护']
"""
# 获取当前行的有效单元格长度
print(table_name.row_len(3))
print(table_index.row_len(3))
"""
7
8
"""
(4)sheet工作表单元格操作
单元格是组成表格的最小单位,可以拆分或合并。每个数据的输入和修改都是在单元格中进行的。
# 获取指定单元格内容
print(table_name.cell(1,0).value) # 第二行第一列
print(table_name.cell_value(2,1)) # 第三行第二列
print(table_name.row(1)[0].value) # 第二行第一列
"""
机构名称
张八
机构名称
"""
# 获取单元格内容的数据类型
# ctype说明:0 empty, 1 string, 2 number, 3 date, 4 boolean, 5 error
print(table_index.cell(1,0).ctype) # 银行1表,2行1列内容 机构名称
print(table_index.cell(3,4).ctype) # 银行1表,4行5列内容 888
print(table_index.cell(2,6).ctype) # 银行1表,3行7列内容 2019/5/7
"""
1
2
3
"""
# 日期单元格内容处理
from datetime import datetime, date
if table_index.cell(2,6).ctype == 3:
print(table_index.cell(2, 6).value)
date_value = xlrd.xldate_as_tuple(table_index.cell(2, 6).value, data.datemode)
print(date_value)
print(date(*date_value[:3]))
print(date(*date_value[:3]).strftime('%Y/%m/%d'))
"""
43592.0
(2019, 5, 7, 0, 0, 0)
2019-05-07
2019/05/07
"""
# 获取number类型的单元格内容
if table_index.cell(3, 4).ctype == 2:
print(table_index.cell(3, 4).value)
num_value = int(table_index.cell(3, 4).value) # 转为整型
print(num_value)
"""
888.0
888
"""
(5)获取合并单元格内容
需要使用merged_cells属性,获取merged_cells返回的row和col低位的索引即可。
# 需要在读取文件时添加formatting_info参数,默认是False
# 需要设置为True,才能调用merged_cells属性获取到值
xls_data = xlrd.open_workbook('联系人.xls', formatting_info=True)
sheet_data = xls_data.sheet_by_name('银行2')
print(sheet_data.merged_cells)
"""
[(0, 1, 0, 7), (2, 5, 0, 1)]
"""
merged_cells返回的这四个参数的含义:(row,row_range,col,col_range)。
因此,(0,1,0,7)表示第1列~第7列合并;(2,5,0,1)表示第3行~第6行合并。
# 分别获取合并两个单元格内容
merge_value = []
for (row, row_range, col, col_range) in sheet_data.merged_cells:
merge_value.append((row, col))
"""
[(0, 0), (2, 0)]
"""
print(merge_value)
for i in merge_value:
print(sheet_data.cell(i[0], i[1]).value)
"""
银行2
银行2
"""
3、xlwt使用详解
使用xlwt模块对Excel文件进行创建、设置、保存等操作。
import xlwt # 创建一个工作簿(workbook),并设置编码
# workbook = xlwt.Workbook(encoding='ascii')
workbook = xlwt.Workbook(encoding='utf-8') # 创建一个工作表(worksheet)
worksheet = workbook.add_sheet("My Worksheet") # 样式设置(可选)
style = xlwt.XFStyle() # 初始化样式
font = xlwt.Font() # 为样式创建字体
font.name = "Times New Roman"
font.bold = True # 加粗
font.underline = True # 下划线
font.italic = True # 斜体字
style.font = font # 设定样式 # 写入excel,参数对应 行 列 值
# 不带样式的写入
worksheet.write(1,0, 'Unformatted value')
# 带样式的写入
worksheet.write(2,0, 'Formatted value', style) # 保存文件
workbook.save("xlwt_test.xls")
打开Excel文件显示效果如下:
(1)设置单元格宽度
import xlwt workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
worksheet.write(0, 0,'My Cell Contents')
# 设置单元格宽度
worksheet.col(0).width = 30003
workbook.save('cell_width.xls')
显示效果:
(2)输入日期到单元格
import xlwt
import datetime workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet') style = xlwt.XFStyle()
style.num_format_str = 'M/D/YY' # Other options: D-MMM-YY, D-MMM, MMM-YY, h:mm, h:mm:ss, h:mm, h:mm:ss, M/D/YY h:mm, mm:ss, [h]:mm:ss, mm:ss.0 worksheet.write(0, 0, datetime.datetime.now(), style)
workbook.save('Excel_Workbook.xls')
显示效果:
(3)添加公式到单元格
import xlwt workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
worksheet.write(0, 0, 5) # Outputs 5
worksheet.write(0, 1, 2) # Outputs 2 # 添加公式
worksheet.write(1, 0, xlwt.Formula('A1*B1')) # Should output "10" (A1[5] * A2[2])
worksheet.write(1, 1, xlwt.Formula('SUM(A1,B1)')) # Should output "7" (A1[5] + A2[2]) workbook.save('Excel_formula.xls')
显示效果:
(4)添加超链接到单元格
import xlwt workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet') worksheet.write(0, 0, xlwt.Formula('HYPERLINK("http://www.baidu.com";"Baidu")')) # Outputs the text "Baidu" linking to http://www.baidu.com workbook.save('Excel_hyperlink.xls')
显示效果:
(5)合并列和行
import xlwt workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet') worksheet.write_merge(0, 0, 0, 3, 'First Merge') # Merges row 0's columns 0 through 3.
font = xlwt.Font() # Create Font
font.bold = True # Set font to Bold
style = xlwt.XFStyle() # Create Style
style.font = font # Add Bold Font to Style
worksheet.write_merge(1, 2, 0, 3, 'Second Merge', style) # Merges row 1 through 2's columns 0 through 3.
workbook.save('Excel_merge.xls')
显示效果:
(6)其他单元格设置
"""
设置单元格内容的对其方式:
"""
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
alignment = xlwt.Alignment() # Create Alignment
alignment.horz = xlwt.Alignment.HORZ_CENTER # May be: HORZ_GENERAL, HORZ_LEFT, HORZ_CENTER, HORZ_RIGHT, HORZ_FILLED, HORZ_JUSTIFIED, HORZ_CENTER_ACROSS_SEL, HORZ_DISTRIBUTED
alignment.vert = xlwt.Alignment.VERT_CENTER # May be: VERT_TOP, VERT_CENTER, VERT_BOTTOM, VERT_JUSTIFIED, VERT_DISTRIBUTED
style = xlwt.XFStyle() # Create Style
style.alignment = alignment # Add Alignment to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls') """
为单元格议添加边框:
"""
# Please note: While I was able to find these constants within the source code, on my system (using LibreOffice,) I was only presented with a solid line, varying from thin to thick; no dotted or dashed lines.
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
borders = xlwt.Borders() # Create Borders
borders.left = xlwt.Borders.DASHED
DASHED虚线
NO_LINE没有
THIN实线
# May be: NO_LINE, THIN, MEDIUM, DASHED, DOTTED, THICK, DOUBLE, HAIR, MEDIUM_DASHED, THIN_DASH_DOTTED, MEDIUM_DASH_DOTTED, THIN_DASH_DOT_DOTTED, MEDIUM_DASH_DOT_DOTTED, SLANTED_MEDIUM_DASH_DOTTED, or 0x00 through 0x0D.
borders.right = xlwt.Borders.DASHED
borders.top = xlwt.Borders.DASHED
borders.bottom = xlwt.Borders.DASHED
borders.left_colour = 0x40
borders.right_colour = 0x40
borders.top_colour = 0x40
borders.bottom_colour = 0x40
style = xlwt.XFStyle() # Create Style
style.borders = borders # Add Borders to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls') """
为单元格设置背景色:
"""
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
pattern = xlwt.Pattern() # Create the Pattern
pattern.pattern = xlwt.Pattern.SOLID_PATTERN # May be: NO_PATTERN, SOLID_PATTERN, or 0x00 through 0x12
pattern.pattern_fore_colour = 5 # May be: 8 through 63. 0 = Black, 1 = White, 2 = Red, 3 = Green, 4 = Blue, 5 = Yellow, 6 = Magenta, 7 = Cyan, 16 = Maroon, 17 = Dark Green, 18 = Dark Blue, 19 = Dark Yellow , almost brown), 20 = Dark Magenta, 21 = Teal, 22 = Light Gray, 23 = Dark Gray, the list goes on...
style = xlwt.XFStyle() # Create the Pattern
style.pattern = pattern # Add Pattern to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls')
二、导出excel表(读django字段数据)
在django项目中实现用excel导出数据库中数据。
1、添加导出excel路由
这里是基于crm项目实现,在customer配置类中添加excel路由:
class CustomerConfig(ModelStark):
"""代码省略"""
def extra_url(self):
"""扩展路由"""
temp = []
temp.append(url(r"mycustomer/", self.mycustomer))
temp.append(url(r'export/', self.excel_export))
return temp
2、导出excel视图函数
# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
"""代码省略""" def excel_export(self, request):
"""导出excel表格"""
list_obj = models.Customer.objects.all().order_by("create_time")
if list_obj:
# 创建工作薄
ws = Workbook(encoding="UTF-8")
w = ws.add_sheet(u'数据报表第一页')
w.write(0, 0, 'id')
w.write(0, 1, u'姓名')
w.write(0, 2, u'性别')
w.write(0, 3, u'民族')
w.write(0, 4, u'籍贯')
w.write(0, 5, u'身份证号')
w.write(0, 6, u'通知书邮寄地址')
w.write(0, 7, u'邮编')
w.write(0, 8, u'联系电话')
w.write(0, 9, u'联系电话2')
w.write(0, 10, u'院校')
w.write(0, 11, u'专业')
w.write(0, 12, u'创建日期')
w.write(0, 13, u'生源人')
w.write(0, 14, u'备注')
# 写入数据
excel_row = 1
for obj in list_obj:
data_id = obj.id
data_name = obj.name
# data_gender = obj.gender_choices # 只显示数字
data_gender = obj.get_gender_display()
data_nation = obj.nation
data_birth = obj.birth_place
data_identity_num = obj.identity_num
data_address = obj.address
data_postcode = obj.postcode
data_tel = obj.tel
data_tel2 = obj.tel_2
data_school = obj.stu_school.title
data_course = obj.course.first().name
data_time = obj.create_time.strftime('%Y-%m-%d %H:%M:%S')
data_consultant = obj.consultant.name
data_memo = obj.memo
w.write(excel_row, 0, data_id)
w.write(excel_row, 1, data_name)
w.write(excel_row, 2, data_gender)
w.write(excel_row, 3, data_nation)
w.write(excel_row, 4, data_birth)
w.write(excel_row, 5, data_identity_num)
w.write(excel_row, 6, data_address)
w.write(excel_row, 7, data_postcode)
w.write(excel_row, 8, data_tel)
w.write(excel_row, 9, data_tel2)
w.write(excel_row, 10, data_school)
w.write(excel_row, 11, data_course)
w.write(excel_row, 12, data_time)
w.write(excel_row, 13, data_consultant)
w.write(excel_row, 14, data_memo)
excel_row += 1
# 检测文件是否存在
# 方框中代码是保存本地文件使用,如不需要请删除该代码
###########################
exist_file = os.path.exists("stu_info.xls")
if exist_file:
os.remove(r"stu_info.xls")
ws.save("customer_info.xls")
############################
sio = BytesIO()
ws.save(sio)
sio.seek(0)
response = HttpResponse(sio.getvalue(), content_type='application/vnd.ms-excel')
response['Content-Disposition'] = 'attachment; filename=stu_info.xls'
response.write(sio.getvalue())
return response
(1)获取日期并转化格式
data_time = obj.create_time.strftime('%Y-%m-%d %H:%M:%S')
(2)获取一对多对象名称
data_consultant = obj.consultant.name
(3)获取多对多对象名称
data_course = obj.course.first().name
3、将注册的模型类添加到字典_registry中
site.register(models.Customer, CustomerConfig)
三、导入excel表(插入django字段数据)
导入时,一对多字段和多对多字段处理需要特别注意。
1、添加导入Excel路由
# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
def extra_url(self):
"""扩展路由"""
temp = []
temp.append(url(r"mycustomer/", self.mycustomer))
temp.append(url(r'export/', self.excel_export))
temp.append(url(r'import/', self.excel_import))
return temp
2、导入Excel视图函数
# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
"""省略代码"""
def excel_import(self, request):
"""批量导入数据"""
if request.method == 'GET':
return render(request, 'excel_import.html', locals())
# return JsonResponse({'msg': '不是post请求'})
else:
user_id = request.session.get("user_id")
file_obj = request.FILES.get('my_file')
type_excel = file_obj.name.split('.')[1]
if 'xls' == type_excel:
# 开始解析上传的excel表格
wb = xlrd.open_workbook(filename=None, file_contents=file_obj.read())
table = wb.sheets()[0]
nrows = table.nrows # 行数
# ncole = table.ncols # 列数
try:
# 正常的数据库操作应该是原子性操作
with transaction.atomic():
for i in range(1, nrows):
# i/o
row_value = table.row_values(i) # 一行的数据
# 添加多对多字段
# 主要这里不能使用get,否则报错:'Course' object is not iterable
course_obj = models.Course.objects.filter(name=row_value[9])
print(row_value[10], type(row_value[10])) # 1002.0 <class 'float'>
consultant_obj = models.UserInfo.objects.get(code=str(int(row_value[10])))
# 生成学生对象,添加
customer_obj = models.Customer.objects.create(
name=row_value[0],
gender=row_value[1],
nation=row_value[2],
birth_place=row_value[3],
identity_num=row_value[4],
address=row_value[5],
postcode=row_value[6],
tel=row_value[7],
tel_2=row_value[8],
stu_school_id=1,
create_time=datetime.datetime.now(),
consultant=consultant_obj, # 一对多字段
memo=row_value[11]
)
# create的时候不写多对多字段,写完后单独设置即可
customer_obj.course.set(course_obj)
except Exception as e:
return HttpResponse('出现错误...%s' % e)
return HttpResponse("上传成功")
return HttpResponse('上传文件格式不是xls')
(1)一对多字段
consultant字段是一对多字段,使用如下方法添加:
consultant_obj = models.UserInfo.objects.get(code=str(int(row_value[10])))
# 生成学生对象,添加
customer_obj = models.Customer.objects.create(
"""代码省略"""
consultant=consultant_obj, # 一对多字段
)
(2)多对多字段
course字段是多对多字段,使用如下方法添加:
# 添加多对多字段
# 主要这里不能使用get,否则报错:'Course' object is not iterable
course_obj = models.Course.objects.filter(name=row_value[9])
print(row_value[10], type(row_value[10])) # 1002.0 <class 'float'>
# 生成学生对象,添加
customer_obj = models.Customer.objects.create("""代码省略""")
# create的时候不写多对多字段,写完后单独设置即可
customer_obj.course.set(course_obj)