微信搜索superit|邀请体验:大数据, 数据管理、OLAP分析与可视化平台 | 赞助作者:赞助作者

Python 把特殊字符(U+10000 及以上的四字节 Unicode 字符)替换掉,词典转换

我的操作 aide_941 2℃ 0评论
import re

# Remove every supplementary-plane character (U+10000..U+10FFFF) from the
# dictionary SQL dump and write the cleaned copy to test.sql.
# NOTE(review): presumably done so the dump can be imported over a MySQL
# connection limited to the 3-byte "utf8" charset -- confirm.
file_path = "F:/python/spider/牛津高阶英汉双解词典(第9版)- 带高清版图片.sql"

# Correct pattern for matching supplementary Unicode characters (U+10000 to U+10FFFF)
pattern = r'[\U00010000-\U0010FFFF]'
replacement = ''
# Compile once; the same pattern is applied to every line below.
supplementary_re = re.compile(pattern)

# Stream line by line instead of f.read() so memory use stays bounded no
# matter how large the dump is. The pattern matches one character at a
# time, so per-line substitution yields exactly the same output as
# substituting over the whole file.
with open(file_path, 'r', encoding='utf-8') as f, \
        open('F:/python/spider/test.sql', 'w', encoding='utf-8') as ff:
    for line in f:
        ff.write(supplementary_re.sub(replacement, line))

----------

/*
Navicat MySQL Data Transfer

Source Server         : localhost
Source Server Version : 50710
Source Host           : localhost:3306
Source Database       : oxf

Target Server Type    : MYSQL
Target Server Version : 50710
File Encoding         : 65001

Date: 2025-07-22 14:44:06
*/

-- Turn off foreign-key checking for the statements that follow in this session.
SET FOREIGN_KEY_CHECKS = 0;

-- ----------------------------
-- Table structure for alt
-- ----------------------------
-- alt: pairs an integer id with a string w of up to 50 characters.
-- No primary key is declared; each column only gets a non-unique index.
-- NOTE(review): presumably alternative spellings keyed by word id -- verify.
DROP TABLE IF EXISTS `alt`;
CREATE TABLE `alt` (
  `id` INT(11)     NOT NULL,
  `w`  VARCHAR(50) DEFAULT NULL,
  KEY `idx_alt_w`  (`w`) USING BTREE,
  KEY `idx_alt_id` (`id`)
) ENGINE = InnoDB
  DEFAULT CHARSET = utf8mb4;

-- ----------------------------
-- Table structure for dbinfo
-- ----------------------------
-- dbinfo: descriptive attributes of the database, keyed by id.
-- Every attribute except description is a nullable string of up to 50 characters.
DROP TABLE IF EXISTS `dbinfo`;
CREATE TABLE `dbinfo` (
  `id`          INT(11)     NOT NULL,
  `dbname`      VARCHAR(50) DEFAULT NULL,
  `author`      VARCHAR(50) DEFAULT NULL,
  `version`     VARCHAR(50) DEFAULT NULL,
  `direction`   VARCHAR(50) DEFAULT NULL,
  `origLang`    VARCHAR(50) DEFAULT NULL,
  `destLang`    VARCHAR(50) DEFAULT NULL,
  `license`     VARCHAR(50) DEFAULT NULL,
  `category`    VARCHAR(50) DEFAULT NULL,
  `description` TEXT,
  PRIMARY KEY (`id`)
) ENGINE = InnoDB
  DEFAULT CHARSET = utf8mb4;

-- ----------------------------
-- Table structure for dbinfo_extra
-- ----------------------------
-- dbinfo_extra: free-form name/value text pairs, keyed by id.
DROP TABLE IF EXISTS dbinfo_extra;
CREATE TABLE dbinfo_extra (
  id int(11) NOT NULL,
  name text,
  value text,
  -- The primary key already enforces uniqueness of id and provides the
  -- index; the former extra "UNIQUE KEY id (id)" duplicated it and only
  -- added storage and write overhead, so it is dropped.
  PRIMARY KEY (id)
) ENGINE=InnoDB DEFAULT CHARSET=utf8mb4;

-- ----------------------------
-- Table structure for word
-- ----------------------------
-- word: one row per entry with a nullable integer id, a string w of up to
-- 100 characters and a longtext body m.
-- NOTE(review): presumably w is the headword and m the entry content -- verify.
DROP TABLE IF EXISTS word;
CREATE TABLE word (
  id int(10) DEFAULT NULL,
  w varchar(100) DEFAULT NULL,
  m longtext,
  -- Non-unique indexes mirroring those on alt, so lookups by w or id do
  -- not have to scan every longtext row. They are deliberately not
  -- UNIQUE / PRIMARY: the original schema allows NULL and duplicate
  -- values, and the dump's data must still load unchanged.
  KEY idx_word_w (w) USING BTREE,
  KEY idx_word_id (id)
) ENGINE=InnoDB DEFAULT CHARSET=utf8mb4;
# MySQL option file (my.ini) for the local 5.7.10 server.
[mysqld]
port=3306
basedir=F:\mysql-5.7.10-winx64
datadir=F:\mysql-5.7.10-winx64\Data
max_connections=200
max_connect_errors=10
# utf8mb4 rather than utf8: MySQL's "utf8" is the 3-byte utf8mb3 subset and
# cannot represent characters above U+FFFF, while the tables in the dump
# are declared with DEFAULT CHARSET=utf8mb4.
character-set-server=utf8mb4
default-storage-engine=INNODB
explicit_defaults_for_timestamp=true
# NOTE(review): 0.0.0.0 listens on every network interface; restrict this
# if remote access is not required.
bind-address = 0.0.0.0
sql_mode=STRICT_TRANS_TABLES,NO_ZERO_IN_DATE,NO_ZERO_DATE,ERROR_FOR_DIVISION_BY_ZERO,NO_ENGINE_SUBSTITUTION
[mysql]
# Keep the command-line client's connection charset in step with the server.
default-character-set=utf8mb4
[client]
port=3306
# Same for every other client program that reads the [client] group.
default-character-set=utf8mb4

 

转载请注明:SuperIT » python把特殊字符替换掉,词典转换

喜欢 (0)or分享 (0)

您必须 登录 才能发表评论!