| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263 |
- <?php
- /*
- 从旧数据表中提取数据插入到新的表
- 插入时用uuid判断是否曾经插入
- 曾经插入就不插入了
- */
- require_once __DIR__."/../../../public/app/config.php";
- require_once __DIR__."/../../../public/app/public/snowflakeid.php";
- set_exception_handler(function($e){
- fwrite(STDERR,"error-msg:".$e->getMessage().PHP_EOL);
- fwrite(STDERR,"error-file:".$e->getFile().PHP_EOL);
- fwrite(STDERR,"error-line:".$e->getLine().PHP_EOL);
- exit;
- });
- $start = time();
- # 雪花id
- $snowflake = new SnowFlakeId();
- $fpError = fopen(__DIR__.'/log/'.basename($_SERVER['PHP_SELF'],'.php').".err.data.csv",'w');
- # 更新索引表
- $src_db=_SQLITE_DB_WBW_;#源数据库
- $src_table=_SQLITE_TABLE_DICT_WBW_;#源表名
- $dest_db=_PG_DB_WBW_;#目标数据库
- $dest_table=_PG_TABLE_DICT_WBW_;#目标表名
- echo "migarate user dict".PHP_EOL;
- #打开源数据库
- $PDO_SRC = new PDO($src_db,_DB_USERNAME_,_DB_PASSWORD_,array(
- PDO::ATTR_PERSISTENT=>true,
- PDO::SQLITE_ATTR_OPEN_FLAGS => PDO::SQLITE_OPEN_READONLY
- ));
- $PDO_SRC->setAttribute(PDO::ATTR_ERRMODE, PDO::ERRMODE_EXCEPTION);
- echo "open src".PHP_EOL;
- #打开目标数据库
- $PDO_DEST = new PDO($dest_db,_DB_USERNAME_,_DB_PASSWORD_,array(PDO::ATTR_PERSISTENT=>true));
- $PDO_DEST->setAttribute(PDO::ATTR_ERRMODE, PDO::ERRMODE_EXCEPTION);
- echo "open dest".PHP_EOL;
- #删除目标数据表中全部数据
- fwrite(STDOUT,"delete dest".PHP_EOL);
- $query = "delete from $dest_table where true;";
- $stmtDest = $PDO_DEST->prepare($query);
- $stmtDest->execute();
- $queryInsert = "INSERT INTO ".$dest_table."
- (
- id,
- word ,
- type,
- grammar,
- parent,
- mean,
- note,
- factors,
- factormean,
- status,
- source,
- language,
- confidence,
- creator_id,
- ref_counter,
- create_time,
- created_at,
- updated_at
- )
- VALUES (? , ? , ? , ? ,? ,? ,? ,? ,? ,? ,? , ?,?,?,?,?,to_timestamp(?),to_timestamp(?))";
- echo "read from orginal".PHP_EOL;
- $commitData = [];
- $allInsertCount = 0;
- $allSrcCount = 0;
- $count = 0;
- #从源数据表中读取
- $query = "SELECT * FROM ".$src_table;
- $stmtSrc = $PDO_SRC->prepare($query);
- $stmtSrc->execute();
- while($srcData = $stmtSrc->fetch(PDO::FETCH_ASSOC)){
- $allSrcCount++;
- #插入目标表
- if(empty($srcData["pali"]) ){
- fwrite(STDERR,"pali is null id=".$srcData["id"].PHP_EOL);
- fputcsv($fpError,$srcData);
- continue;
- }
- if(empty($srcData["creator"]) ){
- fwrite(STDERR,"creator is null id=".$srcData["id"].PHP_EOL);
- fputcsv($fpError,$srcData);
- continue;
- }
- $commitData[] = array(
- $snowflake->id(),
- $srcData["pali"],
- $srcData["type"],
- $srcData["gramma"],
- $srcData["parent"],
- $srcData["mean"],
- $srcData["note"],
- $srcData["factors"],
- $srcData["factormean"],
- $srcData["status"],
- "_SYS_USER_WBW_",
- $srcData["language"],
- $srcData["confidence"],
- $srcData["creator"],
- $srcData["ref_counter"],
- $srcData["time"],
- $srcData["time"],
- $srcData["time"]
- );
- $count++;
- $allInsertCount++;
-
- if($count ==10000){
- #10000行插入一次
- $PDO_DEST->beginTransaction();
- $stmtDEST = $PDO_DEST->prepare($queryInsert);
- foreach ($commitData as $key => $value) {
- try{
- $stmtDEST->execute($value);
- }catch(PDOException $e){
- fwrite(STDERR,$e->getMessage().PHP_EOL);
- fwrite(STDERR,implode(',',$value).PHP_EOL);
- exit;
- }
- }
- // 提交更改
- $PDO_DEST->commit();
- $commitData = [];
- echo "finished $count".PHP_EOL;
- $count=0;
- }
- if($allSrcCount % 10000 ==0){
- echo "find from src table $allSrcCount / $allInsertCount is new.".PHP_EOL;
- }
- }
- if($count>0){
- #最后的没有到10000的数据插入
- $PDO_DEST->beginTransaction();
- $stmtDEST = $PDO_DEST->prepare($queryInsert);
- foreach ($commitData as $key => $value) {
- $stmtDEST->execute($value);
- }
- // 提交更改
- $PDO_DEST->commit();
- $commitData = [];
- echo "finished $count".PHP_EOL;
- }
- echo "insert done $allInsertCount in $allSrcCount ".PHP_EOL;
- # 更新索引表
- $src_table=_SQLITE_TABLE_DICT_WBW_INDEX_;#源表名
- $src_word_table=_SQLITE_TABLE_DICT_WBW_;#源word表名
- echo "migarating usr dict index ".PHP_EOL;
- // 开始一个事务,关闭自动提交
- $commitData = [];
- $allInsertCount = 0;
- $allSrcCount = 0;
- $count = 0;
- #从源数据表中读取
- $query = "SELECT * FROM ".$src_table;
- $stmtSrc = $PDO_SRC->prepare($query);
- $stmtSrc->execute();
- while($srcData = $stmtSrc->fetch(PDO::FETCH_ASSOC)){
- $allSrcCount++;
- #插入目标表
- $wordIndex = $srcData["word_index"];
- #查询目标表中的数据
- $queryExsit = "SELECT * FROM ".$src_word_table." WHERE id = ? ";
- $getWord = $PDO_SRC->prepare($queryExsit);
- $getWord->execute(array($wordIndex));
- $exist = $getWord->fetch(PDO::FETCH_ASSOC);
- if($exist){
- if(empty($srcData["user_id"]) ){
- fwrite(STDERR,"index user_id is null id=".$srcData["id"].PHP_EOL);
- fputcsv($fpError,$srcData);
- continue;
- }
- if(empty($exist["pali"]) ){
- fwrite(STDERR,"pali is null id=".$srcData["id"].PHP_EOL);
- continue;
- }
- if(empty($exist["creator"]) ){
- fwrite(STDERR,"creator is null id=".$srcData["id"].PHP_EOL);
- continue;
- }
- $commitData[] = array(
- $snowflake->id(),
- $exist["pali"],
- $exist["type"],
- $exist["gramma"],
- $exist["parent"],
- $exist["mean"],
- $exist["note"],
- $exist["factors"],
- $exist["factormean"],
- (int)$exist["status"],
- "_USER_WBW_",
- $exist["language"],
- $exist["confidence"],
- $srcData["user_id"],
- $exist["ref_counter"],
- $exist["time"],
- $exist["time"],
- $exist["time"]
- );
- $count++;
- $allInsertCount++;
- if($count === 10000){
- $PDO_DEST->beginTransaction();
- $stmtDEST = $PDO_DEST->prepare($queryInsert);
- foreach ($commitData as $key => $value) {
- # code...
- $stmtDEST->execute($value);
- }
- // 提交更改
- $PDO_DEST->commit();
- $commitData = [];
- echo "finished $count".PHP_EOL;
- $count = 0;
- }
- }else{
- fwrite(STDERR,"error: no word index - $wordIndex".PHP_EOL);
- }
- if($allSrcCount % 10000 ==0){
- fwrite(STDOUT,"find from src table $allSrcCount / $allInsertCount is new.".PHP_EOL) ;
- }
- }
- if($count>0){
- #最后的没有到10000的数据插入
- $PDO_DEST->beginTransaction();
- $stmtDEST = $PDO_DEST->prepare($queryInsert);
- foreach ($commitData as $key => $value) {
- # code...
- $stmtDEST->execute($value);
- }
- // 提交更改
- $PDO_DEST->commit();
- $commitData = [];
- fwrite(STDOUT,"finished $count".PHP_EOL);
- }
- fwrite(STDOUT,"insert done $allInsertCount in $allSrcCount ".PHP_EOL);
- fwrite(STDOUT, "all done in ".(time()-$start)."s".PHP_EOL);
|