123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636 |
- # encoding=utf8
- """芋道系统数据库迁移工具
- Author: dhb52 (https://gitee.com/dhb52)
- pip install simple-ddl-parser
- """
- import pathlib
- import re
- import time
- from abc import ABC, abstractmethod
- from typing import Dict, Tuple
- from simple_ddl_parser import DDLParser
- PREAMBLE = """/*
- Yudao Database Transfer Tool
- Source Server Type : MySQL
- Target Server Type : {db_type}
- Date: {date}
- */
- """
- def load_and_clean(sql_file: str) -> str:
- """加载源 SQL 文件,并清理内容方便下一步 ddl 解析
- Args:
- sql_file (str): sql文件路径
- Returns:
- str: 清理后的sql文件内容
- """
- REPLACE_PAIR_LIST = (
- (" CHARACTER SET utf8mb4 COLLATE utf8mb4_unicode_ci ", " "),
- (" KEY `", " INDEX `"),
- ("UNIQUE INDEX", "UNIQUE KEY"),
- ("b'0'", "'0'"),
- ("b'1'", "'1'"),
- )
- content = open(sql_file).read()
- for replace_pair in REPLACE_PAIR_LIST:
- content = content.replace(*replace_pair)
- content = re.sub(r"ENGINE.*COMMENT", "COMMENT", content)
- content = re.sub(r"ENGINE.*;", ";", content)
- return content
- class Convertor(ABC):
- def __init__(self, src: str, db_type) -> None:
- self.src = src
- self.db_type = db_type
- self.content = load_and_clean(self.src)
- self.table_script_list = re.findall(r"CREATE TABLE [^;]*;", self.content)
- @abstractmethod
- def translate_type(self, type: str, size: None | int | Tuple[int]) -> str:
- """字段类型转换
- Args:
- type (str): 字段类型
- size (None | int | Tuple[int]): 字段长度描述, 如varchar(255), decimal(10,2)
- Returns:
- str: 类型定义
- """
- pass
- @abstractmethod
- def gen_create(self, table_ddl: Dict) -> str:
- """生成 create 脚本
- Args:
- table_ddl (Dict): 表DDL
- Returns:
- str: 生成脚本
- """
- pass
- @abstractmethod
- def gen_pk(self, table_name: str) -> str:
- """生成主键定义
- Args:
- table_name (str): 表名
- Returns:
- str: 生成脚本
- """
- pass
- @abstractmethod
- def gen_index(self, table_ddl: Dict) -> str:
- """生成索引定义
- Args:
- table_ddl (Dict): 表DDL
- Returns:
- str: 生成脚本
- """
- pass
- @abstractmethod
- def gen_comment(self, table_sql: str, table_name: str) -> str:
- """生成字段/表注释
- Args:
- table_sql (str): 原始表SQL
- table_name (str): 表名
- Returns:
- str: 生成脚本
- """
- pass
- @abstractmethod
- def gen_insert(self, table_name: str) -> str:
- """生成 insert 语句块
- Args:
- table_name (str): 表名
- Returns:
- str: 生成脚本
- """
- pass
- def print(self):
- """打印转换后的sql脚本到终端"""
- print(
- PREAMBLE.format(
- db_type=self.db_type,
- date=time.strftime("%Y-%m-%d %H:%M:%S"),
- )
- )
- error_scripts = []
- for table_sql in self.table_script_list:
- ddl = DDLParser(table_sql.replace("`", "")).run()
- # 如果parse失败, 需要跟进
- if len(ddl) == 0:
- error_scripts.append(table_sql)
- continue
- table_ddl = ddl[0]
- table_name = table_ddl["table_name"]
- # 忽略 quartz 的内容
- if table_name.lower().startswith("qrtz"):
- continue
- # 为每个表生成个5个基本部分
- create = self.gen_create(table_ddl)
- pk = self.gen_pk(table_name)
- index = self.gen_index(table_ddl)
- comment = self.gen_comment(table_sql, table_name)
- inserts = self.gen_insert(table_name)
- # 组合当前表的DDL脚本
- script = f"""{create}
- {pk}
- {index}
- {comment}
- {inserts}
- """
- # 清理
- script = re.sub("\n{3,}", "\n\n", script).strip() + "\n"
- print(script)
- # 将parse失败的脚本打印出来
- if error_scripts:
- for script in error_scripts:
- print(script)
- class PostgreSQLConvertor(Convertor):
- def __init__(self, src):
- super().__init__(src, "PostgreSQL")
- def translate_type(self, type, size):
- """类型转换"""
- type = type.lower()
- if type == "varchar":
- return f"varchar({size})"
- if type == "int":
- return "int4"
- if type == "bigint" or type == "bigint unsigned":
- return "int8"
- if type == "datetime":
- return "timestamp"
- if type == "bit":
- return "bool"
- if type in ("tinyint", "smallint"):
- return "int2"
- if type == "text":
- return "text"
- if type in ("blob", "mediumblob"):
- return "bytea"
- if type == "decimal":
- return (
- f"numeric({','.join(str(s) for s in size)})" if len(size) else "numeric"
- )
- def gen_create(self, ddl: Dict) -> str:
- """生成 create"""
- def _generate_column(col):
- name = col["name"].lower()
- if name == "deleted":
- return "deleted int2 NOT NULL DEFAULT 0"
- type = col["type"].lower()
- full_type = self.translate_type(type, col["size"])
- nullable = "NULL" if col["nullable"] else "NOT NULL"
- default = f"DEFAULT {col['default']}" if col["default"] is not None else ""
- return f"{name} {full_type} {nullable} {default}"
- table_name = ddl["table_name"].lower()
- columns = [f"{_generate_column(col).strip()}" for col in ddl["columns"]]
- script = f"""-- ----------------------------
- -- Table structure for {table_name}
- -- ----------------------------
- DROP TABLE IF EXISTS {table_name};
- CREATE TABLE {table_name} (
- {',\n '.join(columns)}
- );"""
- return script
- def gen_comment(self, table_sql, table_name) -> str:
- """生成字段及表的注释"""
- script = ""
- for line in table_sql.split("\n"):
- match = re.match(r"^`([^`]+)`.* COMMENT '([^']+)'", line.strip())
- if match:
- script += f"COMMENT ON COLUMN {table_name}.{match.group(1)} IS '{match.group(2).replace('\\n', '\n')}';\n"
- match = re.search(r"COMMENT \= '([^']+)';", table_sql)
- table_comment = match.group(1) if match else None
- if table_comment:
- script += f"COMMENT ON TABLE {table_name} IS '{table_comment}';\n"
- return script
- def gen_pk(self, table_name) -> str:
- """生成主键定义"""
- return f"ALTER TABLE {table_name} ADD CONSTRAINT pk_{table_name} PRIMARY KEY (id);\n"
- def gen_index(self, ddl) -> str:
- """生成 index"""
- def generate_columns(columns):
- keys = [
- f"{col['name'].lower()}{" " + col['order'].lower() if col['order'] != 'ASC' else ''}"
- for col in columns[0]
- ]
- return ", ".join(keys)
- script = ""
- for no, index in enumerate(ddl["index"], 1):
- columns = generate_columns(index["columns"])
- table_name = ddl["table_name"].lower()
- script += (
- f"CREATE INDEX idx_{table_name}_{no:02d} ON {table_name} ({columns});\n"
- )
- return script
- def gen_insert(self, table_name) -> str:
- """生成 insert 语句,以及根据最后的 insert id+1 生成 Sequence"""
- PREFIX = f"INSERT INTO `{table_name}`"
- # 收集 `table_name` 对应的 insert 语句
- inserts = []
- for line in self.content.split("\n"):
- if line.startswith(PREFIX):
- head, tail = line.replace(PREFIX, "").split(" VALUES ", maxsplit=1)
- head = head.strip().replace("`", "").lower()
- tail = tail.strip().replace(r"\"", '"')
- script = f"INSERT INTO {table_name.lower()} {head} VALUES {tail}"
- # bit(1)数据转换
- script = script.replace("b'0'", "'0'").replace("b'1'", "'1'")
- inserts.append(script)
- ## 生成 insert 脚本
- script = ""
- last_id = 0
- if inserts:
- script += f"""\n\n-- ----------------------------
- -- Records of {table_name.lower()}
- -- ----------------------------
- -- @formatter:off
- BEGIN;
- {'\n'.join(inserts)}
- COMMIT;
- -- @formatter:on"""
- match = re.search(r"VALUES \((\d+),", inserts[-1])
- if match:
- last_id = int(match.group(1))
- # 生成 Sequence
- script += (
- "\n\n"
- + f"""DROP SEQUENCE IF EXISTS {table_name}_seq;
- CREATE SEQUENCE {table_name}_seq
- START {last_id + 1};"""
- )
- return script
- class OracleConvertor(Convertor):
- def __init__(self, src):
- super().__init__(src, "Oracle")
- def translate_type(self, type, size: None | int | Tuple[int]):
- """类型转换"""
- type = type.lower()
- if type == "varchar":
- return f"varchar2({size if size < 4000 else 4000})"
- if type == "int":
- return "number"
- if type == "bigint" or type == "bigint unsigned":
- return "number"
- if type == "datetime":
- return "date"
- if type == "bit":
- return "number(1,0)"
- if type in ("tinyint", "smallint"):
- return "smallint"
- if type == "text":
- return "clob"
- if type in ("blob", "mediumblob"):
- return "blob"
- if type == "decimal":
- return (
- f"number({','.join(str(s) for s in size)})" if len(size) else "number"
- )
- def gen_create(self, ddl) -> str:
- """生成 CREATE 语句"""
- def generate_column(col):
- name = col["name"].lower()
- if name == "deleted":
- return "deleted number(1,0) DEFAULT 0 NOT NULL"
- type = col["type"].lower()
- full_type = self.translate_type(type, col["size"])
- nullable = "NULL" if col["nullable"] else "NOT NULL"
- default = f"DEFAULT {col['default']}" if col["default"] is not None else ""
- return f"{'\"size\"' if name == "size" else name } {full_type} {default} {nullable}"
- table_name = ddl["table_name"].lower()
- columns = [f"{generate_column(col).strip()}" for col in ddl["columns"]]
- script = f"""-- ----------------------------
- -- Table structure for {table_name}
- -- ----------------------------
- CREATE TABLE {ddl['table_name'].lower()} (
- {',\n '.join(columns)}
- );"""
- # oracle INSERT '' 不能通过 NOT NULL 校验
- script = script.replace("DEFAULT '' NOT NULL", "DEFAULT '' NULL")
- return script
- def gen_comment(self, table_sql, table_name) -> str:
- script = ""
- for line in table_sql.split("\n"):
- match = re.search(r"`([^`]+)`.* COMMENT '([^']+)'", line)
- if match:
- script += f"COMMENT ON COLUMN {table_name}.{match.group(1)} IS '{match.group(2).replace('\\n', '\n')}';\n"
- match = re.search(r"COMMENT \= '([^']+)';", table_sql)
- table_comment = match.group(1) if match else None
- if table_comment:
- script += f"COMMENT ON TABLE {table_name} IS '{table_comment}';"
- return script
- def gen_pk(self, table_name) -> str:
- """生成主键定义"""
- return f"ALTER TABLE {table_name} ADD CONSTRAINT pk_{table_name} PRIMARY KEY (id);\n"
- def gen_index(self, table_ddl) -> str:
- """生成 INDEX 定义"""
- def generate_columns(columns):
- keys = [
- f"{col['name'].lower()}{" " + col['order'].lower() if col['order'] != 'ASC' else ''}"
- for col in columns[0]
- ]
- return ", ".join(keys)
- script = ""
- for no, index in enumerate(table_ddl["index"], 1):
- columns = generate_columns(index["columns"])
- table_name = table_ddl["table_name"].lower()
- script += (
- f"CREATE INDEX idx_{table_name}_{no:02d} ON {table_name} ({columns});\n"
- )
- return script
- def gen_insert(self, table_name) -> str:
- """拷贝 INSERT 语句"""
- PREFIX = f"INSERT INTO `{table_name}`"
- inserts = []
- for line in self.content.split("\n"):
- if line.startswith(PREFIX):
- head, tail = line.replace(PREFIX, "").split(" VALUES ", maxsplit=1)
- head = head.strip().replace("`", "").lower()
- tail = tail.strip().replace(r"\"", '"')
- script = f"INSERT INTO {table_name.lower()} {head} VALUES {tail}"
- # bit(1)数据转换
- script = script.replace("b'0'", "'0'").replace("b'1'", "'1'")
- # 对日期数据添加 TO_DATE 转换
- script = re.sub(
- r"('\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}')",
- r"to_date(\g<1>, 'SYYYY-MM-DD HH24:MI:SS')",
- script,
- )
- inserts.append(script)
- ## 生成 insert 脚本
- script = ""
- last_id = 0
- if inserts:
- script += f"""\n\n-- ----------------------------
- -- Records of {table_name.lower()}
- -- ----------------------------
- -- @formatter:off
- {'\n'.join(inserts)}
- COMMIT;
- -- @formatter:on"""
- match = re.search(r"VALUES \((\d+),", inserts[-1])
- if match:
- last_id = int(match.group(1))
- # 生成 Sequence
- script += f"""
- CREATE SEQUENCE {table_name}_seq
- START WITH {last_id + 1};"""
- return script
- class SQLServerConvertor(Convertor):
- """_summary_
- Args:
- Convertor (_type_): _description_
- """
- def __init__(self, src):
- super().__init__(src, "Microsoft SQL Server")
- def translate_type(self, type, size):
- """类型转换"""
- type = type.lower()
- if type == "varchar":
- return f"nvarchar({size if size < 4000 else 4000})"
- if type == "int":
- return "int"
- if type == "bigint" or type == "bigint unsigned":
- return "bigint"
- if type == "datetime":
- return "datetime2"
- if type == "bit":
- return "varchar(1)"
- if type in ("tinyint", "smallint"):
- return "tinyint"
- if type == "text":
- return "nvarchar(max)"
- if type in ("blob", "mediumblob"):
- return "varbinary(max)"
- if type == "decimal":
- return (
- f"numeric({','.join(str(s) for s in size)})" if len(size) else "numeric"
- )
- def gen_create(self, ddl: Dict) -> str:
- """生成 create"""
- def _generate_column(col):
- name = col["name"].lower()
- if name == 'id':
- return "id bigint NOT NULL PRIMARY KEY IDENTITY"
- if name == "deleted":
- return "deleted bit DEFAULT 0 NOT NULL"
- type = col["type"].lower()
- full_type = self.translate_type(type, col["size"])
- nullable = "NULL" if col["nullable"] else "NOT NULL"
- default = f"DEFAULT {col['default']}" if col["default"] is not None else ""
- return f"{name} {full_type} {default} {nullable}"
- table_name = ddl["table_name"].lower()
- columns = [f"{_generate_column(col).strip()}" for col in ddl["columns"]]
- script = f"""-- ----------------------------
- -- Table structure for {table_name}
- -- ----------------------------
- DROP TABLE IF EXISTS {table_name};
- CREATE TABLE {table_name} (
- {',\n '.join(columns)}
- )
- GO"""
- return script
- def gen_comment(self, table_sql, table_name) -> str:
- """生成字段及表的注释"""
- script = ""
- for line in table_sql.split("\n"):
- match = re.match(r"^`([^`]+)`.* COMMENT '([^']+)'", line.strip())
- if match:
- script += f"""EXEC sp_addextendedproperty
- 'MS_Description', N'{match.group(2).replace('\\n', '\n')}',
- 'SCHEMA', N'dbo',
- 'TABLE', N'{table_name}',
- 'COLUMN', N'{match.group(1)}'
- GO
- """
- match = re.search(r"COMMENT \= '([^']+)';", table_sql)
- table_comment = match.group(1) if match else None
- if table_comment:
- script += f"""EXEC sp_addextendedproperty
- 'MS_Description', N'{table_comment}',
- 'SCHEMA', N'dbo',
- 'TABLE', N'{table_name}'
- GO
- """
- return script
- def gen_pk(self, table_name) -> str:
- """生成主键定义"""
- return ""
- def gen_index(self, ddl) -> str:
- """生成 index"""
- def generate_columns(columns):
- keys = [
- f"{col['name'].lower()}{" " + col['order'].lower() if col['order'] != 'ASC' else ''}"
- for col in columns[0]
- ]
- return ", ".join(keys)
- script = ""
- for no, index in enumerate(ddl["index"], 1):
- columns = generate_columns(index["columns"])
- table_name = ddl["table_name"].lower()
- script += f"CREATE INDEX idx_{table_name}_{no:02d} ON {table_name} ({columns})\nGO\n"
- return script
- def gen_insert(self, table_name) -> str:
- """生成 insert 语句,以及根据最后的 insert id+1 生成 Sequence"""
- PREFIX = f"INSERT INTO `{table_name}`"
- # 收集 `table_name` 对应的 insert 语句
- inserts = []
- for line in self.content.split("\n"):
- if line.startswith(PREFIX):
- head, tail = line.replace(PREFIX, "").split(" VALUES ", maxsplit=1)
- head = head.strip().replace("`", "").lower()
- tail = tail.strip().replace(r"\"", '"')
- # SQLServer: 字符串前加N,hack,是否存在替换字符串内容的风险
- tail = tail.replace(", '", ", N'").replace("VALUES ('", "VALUES (N')")
- script = f"INSERT INTO {table_name.lower()} {head} VALUES {tail}"
- # bit(1)数据转换
- script = script.replace("b'0'", "'0'").replace("b'1'", "'1'")
- # 删除 insert 的结尾分号
- script = re.sub(";$", r"\nGO", script)
- inserts.append(script)
- ## 生成 insert 脚本
- script = ""
- if inserts:
- script += f"""\n\n-- ----------------------------
- -- Records of {table_name.lower()}
- -- ----------------------------
- -- @formatter:off
- BEGIN TRANSACTION
- GO
- SET IDENTITY_INSERT {table_name.lower()} ON
- GO
- {'\n'.join(inserts)}
- SET IDENTITY_INSERT {table_name.lower()} OFF
- GO
- COMMIT
- GO
- -- @formatter:on"""
- return script
- def main():
- sql_file = pathlib.Path('../mysql/ruoyi-vue-pro.sql').resolve().as_posix()
- # convertor = PostgreSQLConvertor(sql_file)
- # convertor = OracleConvertor(sql_file)
- convertor = SQLServerConvertor(sql_file)
- convertor.print()
- if __name__ == "__main__":
- main()
|