10.14工作第六天

工作内容:
一、纠正大表中的street_id字段
1.删除tc_region中错误的数据(两条重复其中在大表中没出现过的视为错误数据)
2.模糊匹配找出base表中有但是tc_region表中没有的数据(找完看看周哥那有region_id么)进而完善base表
3.根据base表中的名称id对应关系把大表中的street_id纠正

二、试着把base中的所有数据挂到tc_region 这棵树上

sql语句缓存
1.新建一个tc_region副本tc_region_rev

create table if not exists tc_region_rev(like tc_region);
insert into tc_region_rev select * from tc_region;

  

2.tc_region表中的问题数据处理

update tc_region_rev set senior_id=6 where region_name='双环邨街道';
delete from tc_region_rev where region_name='古林街' and region_id=277;
delete from tc_region_rev where region_name='古林街道社区' and region_id=10177;
delete from tc_region_rev where region_name='中塘镇' and region_id=289;
delete from tc_region_rev where region_name='中塘镇社区' and region_id=10189;
delete from tc_region_rev where region_name='太平镇' and region_id=264;
delete from tc_region_rev where region_name='太平镇社区' and region_id=10164;
delete from tc_region_rev where region_name='万新街道' and region_id=167;
delete from tc_region_rev where region_name='万新街道社区' and region_id=10067;
delete from tc_region_rev where region_name='高新区' and region_id=100259;
delete from tc_region_rev where region_name='海滨街道社区' and region_id=10183;
insert into tc_region_rev values (2000001,'120106012000',null,null,null,null,'和苑街道',3,6,null,null,null,null,null,null);
insert into tc_region_rev values (2000002,'120106012001',null,null,null,null,'和苑家园社区',4,2000002,null,null,null,null,null,null);
insert into tc_region_rev values (2000003,'120106012002',null,null,null,null,'全和园社区',4,2000003,null,null,null,null,null,null);
insert into tc_region_rev values (2000004,'120106012003',null,null,null,null,'梦和园社区',4,2000004,null,null,null,null,null,null);
insert into tc_region_rev values (2000005,'120106012004',null,null,null,null,'康和园社区',4,2000005,null,null,null,null,null,null);
insert into tc_region_rev values (2000006,'120106012005',null,null,null,null,'营和园社区',4,2000006,null,null,null,null,null,null);
insert into tc_region_rev values (2000007,'120106012006',null,null,null,null,'名景家园社区',4,2000007,null,null,null,null,null,null);
insert into tc_region_rev values (2000011,'120106X01000',null,null,null,null,'铁路护路网格',3,120106022,null,null,null,null,null,null);
insert into tc_region_rev values (2000012,'120106X01001',null,null,null,null,'行政执法一科',4,2000012,null,null,null,null,null,null);
insert into tc_region_rev values (2000013,'120106X01002',null,null,null,null,'行政执法二科',4,2000013,null,null,null,null,null,null);

  

3.mysql中某个字段重复数据的查询
思路:先用group by 对该字段进行分组,然后用having筛选count(1)>1其中(1)表示查询表的第一个字段

select region_name,count(*) from tc_region_rev group by region_name having count(1)>1;
select region_name from tc_region_rev group by region_name having count(1)>1;
select * from tc_region_rev where region_name in(select region_name from tc_region_rev group by region_name having count(1)>1);

  


4.找出base表模糊匹配tc_region表的困难
(1).从大表筛特殊问题数据。

select distinct street_name from to_stat_rev 
where street_name in('北塘街','北塘街道','俵口乡','俵口镇','茶淀街','茶淀街道','赤龙南镇','赤龙北街道','赤龙南街道','大白庄街道','
大白庄镇','大港街','大港街道','大港水库','大沽街','大沽街道','大寺镇','东马圈镇','港镇','高新区','古林街','古林街道','
生态城','中新生态城管理区','广源街','广源街道','海滨街','汉沽街','汉沽街道','杭州道','杭州道街道','胡家园街','胡家园街道','
华康街道','华明新家园街道','华新街道','芥园街道','芥园道街道','科技园区南区','口东街道','口东镇','廉庄子乡','廉庄镇','临港工业区','
芦台开发区海北镇','南港工业区','潘庄农场','青甸洼','青源街','青源街道','清河农场','曙光农场','双港新家园街道','
双环邨街道','双环村街道','双新街道','孙各庄乡','孙各庄满族乡','太湖路街道','塘沽街','塘沽街道','天津滨海国际机场','
天津经济技术开发区西区','天津铁厂街道','天津经济技术开发区中区','铁路护路网格','未来科技城南区','武清区开发区','
新北街','新北街道','新村街','新村街道','新港街','新港街道','新河街','新河街道','于桥水库','运河西街道','寨上街','寨上街道','
周良庄街道','周良街道');

  

5.创建tc_region与base_region的街名对应关系表

create table 'tc_base'(
'tc_base_id' int auto_increment primary key,
`tc_region_name` varchar(80)DEFAULT NULL,

street_name` varchar(50) DEFAULT NULL,

)

  

原文地址:https://www.cnblogs.com/StarZhai/p/11669504.html