django导入导出excel实践

一、xlrd和xlwt模块介绍

   xlrd模块提供在任何平台上从excel电子表格(.xls和.xlsx)中提取数据的功能,xlwt模块提供生成与Microsoft Excel 95 到2003版本兼容的excel文件的功能。

1、安装方法

# 方法一:
pip3 install xlrd
pip3 install xlwt

# 方法二:
    在python官网http://pypi.python.org/pypi/xlrd/(xlwt)下载xlrd/xlwt的安装包。
    压缩包放置在python安装目录下python/Lib/site-packages。
    解压压缩包:tar zxvf xlrd-1.0.0.tar.gz
    进入到解压的文件夹:cd xlrd-1.0.0
    执行命令:python setup,py install

2、xlrd使用详解

(1)excel文档准备

  准备excel文档:联系人.xls,内容如下所示:

  

  

(2)xlrd获取sheet工作表名称和对象

import xlrd

# 打开Excel文件读取器,加上utf-8编码可防止遇到中文字符乱码
data = xlrd.open_workbook('联系人.xls', encoding_override='utf-8')

# 获取所有sheet工作表名称
sheetnames = data.sheet_names()
print(sheetnames)
"""
['银行1', '银行2']
"""
# 通过索引获取指定sheet工作表名称
sheet_name = data.sheet_names()[1]
print(sheet_name)
"""
银行2
"""
# 通过工作表名称获取sheet对象
table_name = data.sheet_by_name(sheet_name)
print(table_name)
"""
<xlrd.sheet.Sheet object at 0x10b657160>
"""
# 通过sheet索引获取sheet工作表对象
table_index = data.sheet_by_index(0)
print(table_index)
"""
<xlrd.sheet.Sheet object at 0x1073b3f28>
"""

(3)sheet工作表行/列操作

# 获取行数和列数
nrows = table_name.nrows     # 总行数
ncols = table_name.ncols     # 总列数
print("银行2表,总行数: %s,总列数: %s" % (nrows, ncols))
"""
银行2表,总行数: 5,总列数: 7
"""
# 根据sheet对象获取整行和整列的值
sheet_row_val = table_name.row_values(3)
sheet_col_val = table_name.col_values(3)
print("整行的值:%s , \n整列的值: %s" % (sheet_row_val, sheet_col_val))
"""
整行的值:['', '李九', '开发', 'IOS开发', 87888.0, 13213123.0, 'wang1@164.com'] , 
整列的值: ['', '工作职责', 'UI设计', 'IOS开发', '硬件维护']
"""
# 获取当前行的有效单元格长度
print(table_name.row_len(3))
print(table_index.row_len(3))
"""
7
8
"""

(4)sheet工作表单元格操作

  单元格是组成表格的最小单位,可以拆分或合并。每个数据的输入和修改都是在单元格中进行的。

# 获取指定单元格内容
print(table_name.cell(1,0).value)    # 第二行第一列
print(table_name.cell_value(2,1))    # 第三行第二列
print(table_name.row(1)[0].value)    # 第二行第一列
"""
机构名称
张八
机构名称
"""
# 获取单元格内容的数据类型
# ctype说明:0 empty, 1 string, 2 number, 3 date, 4 boolean, 5 error
print(table_index.cell(1,0).ctype)   # 银行1表,2行1列内容  机构名称
print(table_index.cell(3,4).ctype)   # 银行1表,4行5列内容  888
print(table_index.cell(2,6).ctype)   # 银行1表,3行7列内容  2019/5/7
"""
1
2
3
"""
# 日期单元格内容处理
from datetime import datetime, date
if table_index.cell(2,6).ctype == 3:
    print(table_index.cell(2, 6).value)
    date_value = xlrd.xldate_as_tuple(table_index.cell(2, 6).value, data.datemode)
    print(date_value)
    print(date(*date_value[:3]))
    print(date(*date_value[:3]).strftime('%Y/%m/%d'))
"""
43592.0
(2019, 5, 7, 0, 0, 0)
2019-05-07
2019/05/07
"""
# 获取number类型的单元格内容
if table_index.cell(3, 4).ctype == 2:
    print(table_index.cell(3, 4).value)
    num_value = int(table_index.cell(3, 4).value)   # 转为整型
    print(num_value)
"""
888.0
888
""" 

(5)获取合并单元格内容

  需要使用merged_cells属性,获取merged_cells返回的row和col低位的索引即可。

# 需要在读取文件时添加formatting_info参数,默认是False
# 需要设置为True,才能调用merged_cells属性获取到值
xls_data = xlrd.open_workbook('联系人.xls', formatting_info=True)
sheet_data = xls_data.sheet_by_name('银行2')
print(sheet_data.merged_cells)
"""
[(0, 1, 0, 7), (2, 5, 0, 1)]
"""

  merged_cells返回的这四个参数的含义:(row,row_range,col,col_range)。

  因此,(0,1,0,7)表示第1列~第7列合并;(2,5,0,1)表示第3行~第6行合并。

# 分别获取合并两个单元格内容
merge_value = []
for (row, row_range, col, col_range) in sheet_data.merged_cells:
    merge_value.append((row, col))
"""
[(0, 0), (2, 0)]
"""
print(merge_value)
for i in merge_value:
    print(sheet_data.cell(i[0], i[1]).value)
"""
银行2
银行2
"""

3、xlwt使用详解

  使用xlwt模块对Excel文件进行创建、设置、保存等操作。

import xlwt

# 创建一个工作簿(workbook),并设置编码
# workbook = xlwt.Workbook(encoding='ascii')
workbook = xlwt.Workbook(encoding='utf-8')

# 创建一个工作表(worksheet)
worksheet = workbook.add_sheet("My Worksheet")

# 样式设置(可选)
style = xlwt.XFStyle()   # 初始化样式
font = xlwt.Font()       # 为样式创建字体
font.name = "Times New Roman"
font.bold = True         # 加粗
font.underline = True    # 下划线
font.italic = True       # 斜体字
style.font = font        # 设定样式

# 写入excel,参数对应 行 列 值
# 不带样式的写入
worksheet.write(1,0, 'Unformatted value')
# 带样式的写入
worksheet.write(2,0, 'Formatted value', style)

# 保存文件
workbook.save("xlwt_test.xls")

  打开Excel文件显示效果如下:

  

(1)设置单元格宽度

import xlwt

workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
worksheet.write(0, 0,'My Cell Contents')
# 设置单元格宽度
worksheet.col(0).width = 30003
workbook.save('cell_width.xls')

  显示效果:

  

(2)输入日期到单元格

import xlwt
import datetime

workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')

style = xlwt.XFStyle()
style.num_format_str = 'M/D/YY' # Other options: D-MMM-YY, D-MMM, MMM-YY, h:mm, h:mm:ss, h:mm, h:mm:ss, M/D/YY h:mm, mm:ss, [h]:mm:ss, mm:ss.0

worksheet.write(0, 0, datetime.datetime.now(), style)
workbook.save('Excel_Workbook.xls')

  显示效果:

  

(3)添加公式到单元格

import xlwt

workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
worksheet.write(0, 0, 5) # Outputs 5
worksheet.write(0, 1, 2) # Outputs 2

# 添加公式
worksheet.write(1, 0, xlwt.Formula('A1*B1')) # Should output "10" (A1[5] * A2[2])
worksheet.write(1, 1, xlwt.Formula('SUM(A1,B1)')) # Should output "7" (A1[5] + A2[2])

workbook.save('Excel_formula.xls')

  显示效果:

  

(4)添加超链接到单元格

import xlwt

workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')

worksheet.write(0, 0, xlwt.Formula('HYPERLINK("http://www.baidu.com";"Baidu")')) # Outputs the text "Baidu" linking to http://www.baidu.com

workbook.save('Excel_hyperlink.xls')

  显示效果:

  

(5)合并列和行

import xlwt

workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')

worksheet.write_merge(0, 0, 0, 3, 'First Merge') # Merges row 0's columns 0 through 3.
font = xlwt.Font() # Create Font
font.bold = True # Set font to Bold
style = xlwt.XFStyle() # Create Style
style.font = font # Add Bold Font to Style
worksheet.write_merge(1, 2, 0, 3, 'Second Merge', style) # Merges row 1 through 2's columns 0 through 3.
workbook.save('Excel_merge.xls')

  显示效果:

  

(6)其他单元格设置

"""
设置单元格内容的对其方式:
"""
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
alignment = xlwt.Alignment() # Create Alignment
alignment.horz = xlwt.Alignment.HORZ_CENTER # May be: HORZ_GENERAL, HORZ_LEFT, HORZ_CENTER, HORZ_RIGHT, HORZ_FILLED, HORZ_JUSTIFIED, HORZ_CENTER_ACROSS_SEL, HORZ_DISTRIBUTED
alignment.vert = xlwt.Alignment.VERT_CENTER # May be: VERT_TOP, VERT_CENTER, VERT_BOTTOM, VERT_JUSTIFIED, VERT_DISTRIBUTED
style = xlwt.XFStyle() # Create Style
style.alignment = alignment # Add Alignment to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls')

"""
为单元格议添加边框:
"""
# Please note: While I was able to find these constants within the source code, on my system (using LibreOffice,) I was only presented with a solid line, varying from thin to thick; no dotted or dashed lines.
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
borders = xlwt.Borders() # Create Borders
borders.left = xlwt.Borders.DASHED
  DASHED虚线
  NO_LINE没有
  THIN实线
# May be: NO_LINE, THIN, MEDIUM, DASHED, DOTTED, THICK, DOUBLE, HAIR, MEDIUM_DASHED, THIN_DASH_DOTTED, MEDIUM_DASH_DOTTED, THIN_DASH_DOT_DOTTED, MEDIUM_DASH_DOT_DOTTED, SLANTED_MEDIUM_DASH_DOTTED, or 0x00 through 0x0D.
borders.right = xlwt.Borders.DASHED
borders.top = xlwt.Borders.DASHED
borders.bottom = xlwt.Borders.DASHED
borders.left_colour = 0x40
borders.right_colour = 0x40
borders.top_colour = 0x40
borders.bottom_colour = 0x40
style = xlwt.XFStyle() # Create Style
style.borders = borders # Add Borders to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls')

"""
为单元格设置背景色:
"""
import xlwt
workbook = xlwt.Workbook()
worksheet = workbook.add_sheet('My Sheet')
pattern = xlwt.Pattern() # Create the Pattern
pattern.pattern = xlwt.Pattern.SOLID_PATTERN # May be: NO_PATTERN, SOLID_PATTERN, or 0x00 through 0x12
pattern.pattern_fore_colour = 5 # May be: 8 through 63. 0 = Black, 1 = White, 2 = Red, 3 = Green, 4 = Blue, 5 = Yellow, 6 = Magenta, 7 = Cyan, 16 = Maroon, 17 = Dark Green, 18 = Dark Blue, 19 = Dark Yellow , almost brown), 20 = Dark Magenta, 21 = Teal, 22 = Light Gray, 23 = Dark Gray, the list goes on...
style = xlwt.XFStyle() # Create the Pattern
style.pattern = pattern # Add Pattern to Style
worksheet.write(0, 0, 'Cell Contents', style)
workbook.save('Excel_Workbook.xls')

二、导出excel表(读django字段数据)

  在django项目中实现用excel导出数据库中数据。

1、添加导出excel路由 

  这里是基于crm项目实现,在customer配置类中添加excel路由:

class CustomerConfig(ModelStark):
    """代码省略"""
    def extra_url(self):
        """扩展路由"""
        temp = []
        temp.append(url(r"mycustomer/", self.mycustomer))
        temp.append(url(r'export/', self.excel_export))
        return temp

 

2、导出excel视图函数

# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
    """代码省略"""

    def excel_export(self, request):
        """导出excel表格"""
        list_obj = models.Customer.objects.all().order_by("create_time")
        if list_obj:
            # 创建工作薄
            ws = Workbook(encoding="UTF-8")
            w = ws.add_sheet(u'数据报表第一页')
            w.write(0, 0, 'id')
            w.write(0, 1, u'姓名')
            w.write(0, 2, u'性别')
            w.write(0, 3, u'民族')
            w.write(0, 4, u'籍贯')
            w.write(0, 5, u'身份证号')
            w.write(0, 6, u'通知书邮寄地址')
            w.write(0, 7, u'邮编')
            w.write(0, 8, u'联系电话')
            w.write(0, 9, u'联系电话2')
            w.write(0, 10, u'院校')
            w.write(0, 11, u'专业')
            w.write(0, 12, u'创建日期')
            w.write(0, 13, u'生源人')
            w.write(0, 14, u'备注')
            # 写入数据
            excel_row = 1
            for obj in list_obj:
                data_id = obj.id
                data_name = obj.name
                # data_gender = obj.gender_choices  # 只显示数字
                data_gender = obj.get_gender_display()
                data_nation = obj.nation
                data_birth = obj.birth_place
                data_identity_num = obj.identity_num
                data_address = obj.address
                data_postcode = obj.postcode
                data_tel = obj.tel
                data_tel2 = obj.tel_2
                data_school = obj.stu_school.title
                data_course = obj.course.first().name
                data_time = obj.create_time.strftime('%Y-%m-%d %H:%M:%S')
                data_consultant = obj.consultant.name
                data_memo = obj.memo
                w.write(excel_row, 0, data_id)
                w.write(excel_row, 1, data_name)
                w.write(excel_row, 2, data_gender)
                w.write(excel_row, 3, data_nation)
                w.write(excel_row, 4, data_birth)
                w.write(excel_row, 5, data_identity_num)
                w.write(excel_row, 6, data_address)
                w.write(excel_row, 7, data_postcode)
                w.write(excel_row, 8, data_tel)
                w.write(excel_row, 9, data_tel2)
                w.write(excel_row, 10, data_school)
                w.write(excel_row, 11, data_course)
                w.write(excel_row, 12, data_time)
                w.write(excel_row, 13, data_consultant)
                w.write(excel_row, 14, data_memo)
                excel_row += 1
                # 检测文件是否存在
                # 方框中代码是保存本地文件使用,如不需要请删除该代码
                ###########################
            exist_file = os.path.exists("stu_info.xls")
            if exist_file:
                os.remove(r"stu_info.xls")
            ws.save("customer_info.xls")
            ############################
            sio = BytesIO()
            ws.save(sio)
            sio.seek(0)
            response = HttpResponse(sio.getvalue(), content_type='application/vnd.ms-excel')
            response['Content-Disposition'] = 'attachment; filename=stu_info.xls'
            response.write(sio.getvalue())
            return response

 

(1)获取日期并转化格式

data_time = obj.create_time.strftime('%Y-%m-%d %H:%M:%S')

 

(2)获取一对多对象名称

data_consultant = obj.consultant.name

 

(3)获取多对多对象名称

data_course = obj.course.first().name

 

3、将注册的模型类添加到字典_registry中

site.register(models.Customer, CustomerConfig)

 

三、导入excel表(插入django字段数据)

  导入时,一对多字段和多对多字段处理需要特别注意。

1、添加导入Excel路由

# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
    def extra_url(self):
        """扩展路由"""
        temp = []
        temp.append(url(r"mycustomer/", self.mycustomer))
        temp.append(url(r'export/', self.excel_export))
        temp.append(url(r'import/', self.excel_import))
        return temp

 

2、导入Excel视图函数

# 注册客户(学生)到stark
class CustomerConfig(ModelStark):
    """省略代码"""
    def excel_import(self, request):
        """批量导入数据"""
        if request.method == 'GET':
            return render(request, 'excel_import.html', locals())
            # return JsonResponse({'msg': '不是post请求'})
        else:
            user_id = request.session.get("user_id")
            file_obj = request.FILES.get('my_file')
            type_excel = file_obj.name.split('.')[1]
            if 'xls' == type_excel:
                # 开始解析上传的excel表格
                wb = xlrd.open_workbook(filename=None, file_contents=file_obj.read())
                table = wb.sheets()[0]
                nrows = table.nrows    # 行数
                # ncole = table.ncols  # 列数
                try:
                    # 正常的数据库操作应该是原子性操作
                    with transaction.atomic():
                        for i in range(1, nrows):
                            # i/o
                            row_value = table.row_values(i)   # 一行的数据
                            # 添加多对多字段
                            # 主要这里不能使用get,否则报错:'Course' object is not iterable
                            course_obj = models.Course.objects.filter(name=row_value[9])
                            print(row_value[10], type(row_value[10]))  # 1002.0 <class 'float'>
                            consultant_obj = models.UserInfo.objects.get(code=str(int(row_value[10])))
                            # 生成学生对象,添加
                            customer_obj = models.Customer.objects.create(
                                name=row_value[0],
                                gender=row_value[1],
                                nation=row_value[2],
                                birth_place=row_value[3],
                                identity_num=row_value[4],
                                address=row_value[5],
                                postcode=row_value[6],
                                tel=row_value[7],
                                tel_2=row_value[8],
                                stu_school_id=1,
                                create_time=datetime.datetime.now(),
                                consultant=consultant_obj,    # 一对多字段
                                memo=row_value[11]
                            )
                            # create的时候不写多对多字段,写完后单独设置即可
                            customer_obj.course.set(course_obj)
                except Exception as e:
                    return HttpResponse('出现错误...%s' % e)
                return HttpResponse("上传成功")
            return HttpResponse('上传文件格式不是xls')

(1)一对多字段

  consultant字段是一对多字段,使用如下方法添加:

consultant_obj = models.UserInfo.objects.get(code=str(int(row_value[10])))
# 生成学生对象,添加
customer_obj = models.Customer.objects.create(
    """代码省略"""
    consultant=consultant_obj,    # 一对多字段
)

 

(2)多对多字段

  course字段是多对多字段,使用如下方法添加:

# 添加多对多字段
# 主要这里不能使用get,否则报错:'Course' object is not iterable
course_obj = models.Course.objects.filter(name=row_value[9])
print(row_value[10], type(row_value[10]))  # 1002.0 <class 'float'>
# 生成学生对象,添加
customer_obj = models.Customer.objects.create("""代码省略""")
# create的时候不写多对多字段,写完后单独设置即可
customer_obj.course.set(course_obj)

 

posted @ 2019-05-23 15:56  休耕  阅读(15379)  评论(0编辑  收藏  举报