当前位置：首页 > news >正文

mysql导出sql脚本，通过python脚本生成数据库word文档

news 2026/6/15 19:55:11

mysql导出sql脚本，通过python脚本生成数据库word文档

import re
from docx import Document
from docx.shared import Cm, Pt
from docx.enum.text import WD_ALIGN_PARAGRAPH
import osdef extract_all_tables_from_sql_file(file_path):"""从SQL文件中提取所有表结构"""tables = {}try:with open(file_path, 'r', encoding='utf-8', errors='ignore') as f:content = f.read()# 查找所有CREATE TABLE语句create_table_pattern = r'CREATE\s+TABLE\s+(?:IF\s+NOT\s+EXISTS\s+)?`?([a-zA-Z_][a-zA-Z0-9_]*)`?\s*\((.*?)\)\s*ENGINE\s*='matches = re.findall(create_table_pattern, content, re.DOTALL | re.IGNORECASE)print(f"找到 {len(matches)} 个表定义")for i, (table_name, table_body) in enumerate(matches, 1):print(f"解析表 {i}: {table_name}")fields = parse_table_body_simple(table_body)if fields:tables[table_name] = fieldsprint(f"  -> 找到 {len(fields)} 个字段")else:print(f"  -> 警告: 未找到字段")except Exception as e:print(f"读取文件时出错: {e}")return tablesdef parse_table_body_simple(table_body):"""简单解析表体"""fields = []# 清理表体table_body = table_body.strip()# 分割字段行lines = []current_line = ''in_quotes = Falsequote_char = ''paren_depth = 0for char in table_body:if char in ("'", '"') and (not in_quotes or char == quote_char):in_quotes = not in_quotesif in_quotes:quote_char = charelse:quote_char = ''current_line += charelif char == '(' and not in_quotes:paren_depth += 1current_line += charelif char == ')' and not in_quotes and paren_depth > 0:paren_depth -= 1current_line += charelif char == ',' and not in_quotes and paren_depth == 0:lines.append(current_line.strip())current_line = ''else:current_line += charif current_line.strip():lines.append(current_line.strip())# 解析每个字段for line in lines:line = line.strip()if not line:continue# 跳过索引和约束if re.match(r'^(PRIMARY|UNIQUE|KEY|INDEX|CONSTRAINT|FOREIGN|CHECK)', line, re.I):continue# 匹配字段定义# 模式1: 带反引号的字段名pattern1 = r'`([^`]+)`\s+([a-zA-Z]+(?:\(\d+(?:,\s*\d+)?\))?)'# 模式2: 不带反引号的字段名pattern2 = r'(\w+)\s+([a-zA-Z]+(?:\(\d+(?:,\s*\d+)?\))?)'match = re.match(pattern1, line) or re.match(pattern2, line)if not match:continuefield_name = match.group(1)data_type = match.group(2)# 获取剩余部分remaining = line[match.end():].strip()# 分析属性is_nullable = 'NOT NULL' not in remaining.upper()is_auto_increment = 'AUTO_INCREMENT' in remaining.upper()is_primary_key = 'PRIMARY KEY' in remaining.upper()# 提取注释comment = ''comment_match = re.search(r"COMMENT\s+['\"]([^'\"]*)['\"]", remaining, re.I)if comment_match:comment = comment_match.group(1)fields.append({'字段名': field_name,'数据类型': data_type,'是否主键': '是' if is_primary_key else '否','是否自增': '是' if is_auto_increment else '否','允许为空': '是' if is_nullable else '否','注释': comment})return fieldsdef create_word_document_for_tables(tables, output_path='数据库表结构完整版.docx'):"""为所有表创建Word文档"""doc = Document()# 设置样式style = doc.styles['Normal']style.font.name = '宋体'style.font.size = Pt(10.5)# 标题title = doc.add_heading('数据库表结构文档 - 完整版', 0)title.alignment = WD_ALIGN_PARAGRAPH.CENTER# 统计信息total_tables = len(tables)total_fields = sum(len(fields) for fields in tables.values())info = doc.add_paragraph()info.add_run(f'表总数: {total_tables}').bold = Trueinfo.add_run(f'\n字段总数: {total_fields}').bold = Trueinfo.add_run(f'\n生成时间: 2026-04-02\n\n')# 表列表doc.add_heading('表列表', level=1)for i, table_name in enumerate(sorted(tables.keys()), 1):field_count = len(tables[table_name])doc.add_paragraph(f'{i}. {table_name} ({field_count}个字段)', style='List Number')doc.add_page_break()# 详细表结构doc.add_heading('表结构详情', level=1)for i, table_name in enumerate(sorted(tables.keys()), 1):fields = tables[table_name]# 表标题doc.add_heading(f'{i}. 表名: {table_name}', level=2)doc.add_paragraph(f'字段数量: {len(fields)}个\n')if fields:# 创建表格table = doc.add_table(rows=1, cols=6)table.style = 'Table Grid'# 表头headers = ['字段名', '数据类型', '是否主键', '是否自增', '允许为空', '注释']for col_idx, header in enumerate(headers):cell = table.rows[0].cells[col_idx]cell.text = headerfor para in cell.paragraphs:for run in para.runs:run.font.bold = True# 填充数据for field in fields:row = table.add_row()row.cells[0].text = field['字段名']row.cells[1].text = field['数据类型']row.cells[2].text = field['是否主键']row.cells[3].text = field['是否自增']row.cells[4].text = field['允许为空']row.cells[5].text = field['注释']# 设置列宽widths = [Cm(2.8), Cm(2.5), Cm(1.8), Cm(1.8), Cm(1.8), Cm(5.5)]for row in table.rows:for col_idx, cell in enumerate(row.cells):if col_idx < len(widths):cell.width = widths[col_idx]else:doc.add_paragraph('警告: 该表未解析到字段信息', style='Intense Quote')# 添加间距
        doc.add_paragraph()# 如果不是最后一个表，添加分页if i < total_tables:doc.add_page_break()# 保存文档
    doc.save(output_path)return output_pathdef main():"""主函数"""print("="*60)print("SQL转Word文档生成器 - 增强版")print("="*60)# 配置sql_file = "sql/risk_system_db.sql"  # 修改为您的SQL文件名output_file = "doc/risk_system_db.docx"   # 修改为您的WORD文件名if not os.path.exists(sql_file):print(f"错误: 找不到文件 '{sql_file}'")print("请确保文件存在于当前目录")# 显示当前目录文件print("\n当前目录文件:")files = os.listdir('.')sql_files = [f for f in files if f.lower().endswith('.sql')]for f in sql_files:print(f"  - {f}")if sql_files:print(f"\n建议: 修改代码中的 sql_file 变量为 '{sql_files[0]}'")returnprint(f"处理SQL文件: {sql_file}")# 解析SQL文件tables = extract_all_tables_from_sql_file(sql_file)if not tables:print("错误: 未解析到任何表结构")print("可能原因:")print("1. SQL文件格式不正确")print("2. 文件编码不是UTF-8")print("3. SQL语句格式不标准")returnprint(f"\n解析完成:")print(f"  表总数: {len(tables)}")total_fields = sum(len(fields) for fields in tables.values())print(f"  字段总数: {total_fields}")# 显示表信息print("\n表详情:")for i, (table_name, fields) in enumerate(sorted(tables.items()), 1):print(f"  {i:2d}. {table_name:30s} - {len(fields):3d} 个字段")if len(fields) > 0:print(f"      示例字段: {fields[0]['字段名']} ({fields[0]['数据类型']})")# 生成Word文档print(f"\n生成Word文档...")output_path = create_word_document_for_tables(tables, output_file)print(f"✓ 文档已生成: {output_path}")print(f"✓ 请查看生成的文档验证字段数量")if __name__ == "__main__":main()

    # 配置，主要修改以下2个地方，在python编辑器或者服务器上面执行。sql_file = "sql/risk_system_db.sql"  # 修改为您的SQL文件名output_file = "doc/risk_system_db.docx"   # 修改为您的WORD文件名

# 执行命令 - 基本用法
python 文件名.py

# 如果系统中有多个Python版本
python3 文件名.py

查看全文

http://www.jsqmd.com/news/601983/

网络工程师和网络研发工程师都是从事什么的职业？（来源网络，原创）

Aide让大师帮你改代码：专家级代码优化完全解析

Silex开源社区贡献指南：如何参与这个自由软件项目

告别答辩 PPT 返工！Paperxie AI 一键生成，学术风模板直接套用

Linux查看日志常用命令 - 尼卡

分析北京做私人抗衰能预防大病的品牌，推荐哪家 - 工业品牌热点

2026年薄片产线革新：分层夹爪如何适配超薄薄片零损伤抓取？ - 品牌2026

云原生应用的多环境部署策略

Pixel Script Temple参数详解：LoRA秩（Rank）对剧本专业度与风格稳定性的权衡

探讨SOCKS5代理使用教程，美迅代理性价比高不高？ - mypinpai

EdB Prepare Carefully：解决RimWorld开局规划难题的精细化配置方案

the-glorious-dotfiles 锁屏模块详解：PAM 集成与面部捕获

分析北京做私人抗衰能改善精力的推荐哪家 - 工业推荐榜

VCF 部署后实验室一键优化教程

新手福音：无需配置环境，在快马平台用AI理解openclaw核心概念

窗口像素重构技术：重新定义显示分辨率控制范式

SOCKS5代理安装教程哪家好用，该怎么选购 - 工业设备

resty完整用户指南：从基础操作到高级配置

天谋科技入选北京市 2026 年第一批专精特新中小企业

Cheating Daddy终极故障排除指南：10个常见问题与解决方案

终极Goyo.vim配置指南：打造完美无干扰写作环境的10个技巧

深入拆解 Kiro Spec 模式与 Amazon Bedrock AgentCore：Multi-Agent 金融系统从规范生成到 Firecracker microVM 部署

tract性能对比：在Raspberry Pi上比TensorFlow-Lite快3倍的神经网络推理引擎

Tubular多平台支持详解：YouTube、SoundCloud、PeerTube一站式解决方案终极指南

探讨2026年干法造粒机费用，怀科机械长期使用更省成本 - 工业品牌热点

利用Cloudflare实现未备案域名的301重定向全攻略

探寻北京私人糖尿病管理哪家好，远航健康是不错之选 - myqiye

Parcel与CI/CD集成终极指南：自动化构建部署流水线实战

Claude Code 接入开源模型实战：SageMaker 部署 Kimi/GLM + LiteLLM 路由降本 70%

2026年柔性气爪品牌推荐：助力产线柔性化升级的实力厂家 - 品牌2026

mysql导出sql脚本，通过python脚本生成数据库word文档

相关文章：