工作需要,简单的写了一个互导的小功能,对于量大的数据处理还有待优化

多的不说了,直接上代码,需要的可以看看代码注释

欢迎批评指正 :)


##coding=utf8
#单线程,分批导入
#Author : Jeen @ 2013-7
import os,sys,MySQLdb,cx_Oracle,math,time  # python version 2.7.5
os.environ['NLS_LANG']="AMERICAN_AMERICA.AL32UTF8"
reload(sys)
sys.setdefaultencoding('utf8')
fromto = 'mysql2oracle' # mysql2oracle : Export Data FROM Mysql To Oracle
#fromto = 'oracle2mysql' # oracle2mysql : Export Data FROM Oracle To Mysql
from_tables = [ #导出的 表 名称
'P1_WJ_TEST_LANG_SHOP',
'P1_WJ_TEST_LANG_PRODUCT',
'P1_WJ_TEST_LANG_PRODUCT_IMAGE'
] # Data Export From
to_tables = from_tables # Data Import To #导入的 表 名称
#注意:表名需按顺序对应 表名可以不一样  但表结构必须一致  如果需要保留 ID 请修改 get_columns 方法中的相关字符串替换代码
rows_limit = 1000    #分批导入  建议设置不要超过 8000
time_sleep = 1      #分批导入之后等待  n 秒
#-Mysql Database Config
mysql_host = '127.0.0.1'
mysql_user = 'spider'
mysql_pass = 'spider'
mysql_dbname = 'spider'
mysql_port = 3306
#-Oracle Database Config
oracle_host = '192.168.1.222'
oracle_user = 'spider'
oracle_pass = 'spider'
oracle_sid = 'xe'#服务名
oracle_port = 1521
def get_columns(results,coltype) :  #构建部分查询语句的方法
        if len(results) == 0 : return ''
        t = ''
        for result in results :
            t += ', `'+''.join(result) +'`' #mysql 中需要用到的特殊字符
        mysql_columns = t.replace(', `ID`, ','') #移除自增的 ID 列
        oracle_columns = mysql_columns.replace('`','') #Oracle中  去除特殊符号
        if coltype == 'from_mysql' :
            return mysql_columns
        elif coltype == 'from_oracle' :
            return oracle_columns
        elif coltype == 'to_mysql' :
            t = oracle_columns.split(',')
            for i in range(len(t)) :
                t[i] = '%s'
            return  ' ('+mysql_columns+') values ('+','.join(t)+') ' #构建mysql 插入 SQL 片段
        elif coltype == 'to_oracle' :
            t = oracle_columns.split(',')
            for i in range(len(t)) :
                t[i] = ':'+str(i)
            return  ' ('+oracle_columns+') values ('+','.join(t)+') ' #构建Oracle 插入 SQL 片段
        else :
            return ''
try :
    # connect to Mysql
    mysql_conn = MySQLdb.connect(host=mysql_host,user=mysql_user,passwd=mysql_pass,port=mysql_port,db=mysql_dbname,charset='utf8')
    # connect to Oracle
    oracle_dsn = cx_Oracle.makedsn(oracle_host,oracle_port,oracle_sid)
    oracle_conn = cx_Oracle.connect(oracle_user,oracle_pass,oracle_dsn)
    #完成数据库连接
    if fromto == 'mysql2oracle' : # Data from Mysql to Oracle
        for i in range(len(from_tables)) : #循环载入需要导的表
            from_tb = from_tables[i] #导出表
            to_tb = to_tables[i] #导入表
            mysql_cur = mysql_conn.cursor()
            #sql = "select COLUMN_NAME from information_schema.columns where table_name='"+from_tb+"'"
            # 获取 mysql 表 列名, 如希望使用上述SQL方法  请重构 columns_name 的值
            sql = "select * from "+from_tb+" limit 0"
            mysql_cur.execute(sql); #print mysql_cur.description
            columns_name = [col[0] for col in mysql_cur.description] ; #print columns_name
            columns = get_columns(columns_name,'from_mysql'); #print columns
            if columns == '' : raise EOFError('columns error')
            sql = "select count(*) from "+from_tb; #print sql;#统计行数
            mysql_cur.execute(sql)
            results = mysql_cur.fetchone()
            rows_count = results[0]
            mysql_cur.close()
            print 'Total %s rows from Table:%s found in Mysql:%s .\r\nThis program will select %s time(s)(limit %s rows per time) \r\n ... | Start ...' % (rows_count,from_tb,mysql_dbname,int(math.ceil(float(rows_count)/rows_limit)),rows_limit)
            j = 0
            #分批导入
            while j*rows_limit < rows_count :
                mysql_cur = mysql_conn.cursor()
                #构建查询语句
                sql = "select %s from %s limit %s,%s" % (columns,from_tb,j*rows_limit,rows_limit);  #print sql;
                mysql_cur.execute(sql) #执行查询
                results = mysql_cur.fetchall() #保存查询结果
                mysql_cur.close()
                for record in results: #循环读取查询结果
                    oracle_cur = oracle_conn.cursor()
                    sql = "insert into " + to_tb + get_columns(columns_name,'to_oracle') #构建插入语句
                    oracle_cur.execute(sql,record)  #执行插入
                    oracle_conn.commit() #提交
                    oracle_cur.close()
                j += 1; print 'The (%s)th import end. (%s)rows..' % (j,len(results))
                time.sleep(time_sleep) #wait for several seconds
            print 'Data import to table:' + to_tb + ' in Oracle:'+oracle_sid+'    |  Complete ~!  \r\n '
        print '\r\nAll Tables Import Complete ~!' #完成导入
                                     
    #以下部分为 Oracle 导入到Mysql的 逻辑代码, 请直接忽略
    elif fromto == 'oracle2mysql' : # Data from Oracle to Mysql
        for i in range(len(from_tables)) :
            from_tb = from_tables[i]
            to_tb = to_tables[i]
            oracle_cur = oracle_conn.cursor()
            #sql = "select c.column_name from SYS.ALL_CONS_COLUMNS c where c.owner='"+oracle_user+"' and c.table_name='"+from_tb+"'"
            # 获取 Oracle 表 列名, 如希望使用上述SQL方法  请重构 columns_name 的值
            sql = "select * from "+from_tb+" where rownum<1"
            oracle_cur.execute(sql)
            columns_name = [col[0] for col in oracle_cur.description] ;#print columns_name
            columns = get_columns(columns_name,'from_oracle'); #print columns
            if columns == '' : raise EOFError('columns error')
            sql = "select count(*) from "+from_tb; #print sql;
            oracle_cur.execute(sql)
            results = oracle_cur.fetchone()
            rows_count = results[0]
            oracle_cur.close()
            print 'Total %s rows from Table:%s found in Oracle:%s .\r\nThis program will select %s time(s)(limit %s rows per time) \r\n ... | Start ...' % (rows_count,from_tb,oracle_sid,int(math.ceil(float(rows_count)/rows_limit)),rows_limit)
            j = 0
            while j*rows_limit < rows_count :
                oracle_cur = oracle_conn.cursor()
                sql = "select %s from (select rownum rn,%s from %s where rownum <= %s) where rn > %s" % (columns,columns,from_tb,(j+1)*rows_limit,j*rows_limit);  #print sql;
                oracle_cur.execute(sql)
                results = oracle_cur.fetchall()
                oracle_cur.close()
                for record in results:
                    mysql_cur = mysql_conn.cursor()
                    sql = "insert into " + to_tb + get_columns(columns_name,'to_mysql')
                    mysql_cur.execute(sql,record)
                    mysql_conn.commit()
                    mysql_cur.close()
                j += 1; print 'The (%s)th import end.(%s)rows ..' % (j,len(results))
                time.sleep(time_sleep) #wait for several seconds
            print 'Data import to table:' + to_tb + ' in Mysql:'+mysql_dbname+'    |  Complete ~!  \r\n '
        print '\r\nAll Tables Import Complete ~!'
    else :
        print "unknow value of 'fromto' \r\nmake sure 'fromto' like 'mysql2oracle' or 'oracle2mysql' ...."
    #-close database connection
    mysql_conn.close()
    oracle_conn.close()
except EOFError,e :
    print e
finally :
    print 'Database Export/Import Python Code Excute End...\r\nBye~'
    #os.system('PAUSE')