<!-- combin_union.php -->
  <!DOCTYPE html>
  <html>
  <head>
  </head>
  <body>
  <p><a href="index.php">Home</a></p>
  <h2>合并连读词表</h2>
  <?php
  /*
   * Merge the per-entry "<name>_un.csv" word lists into one file,
   * xml/all_union.csv.
   *
   * Input:
   *   - filelist.csv (current directory): one row per entry; column 1 of each
   *     row is the entry name.
   *   - xml/<name>/<name>_un.csv for every entry: the first line is skipped as
   *     a header, every following row is a word record.
   *
   * Rows are de-duplicated on the first '+'-separated component of column 7
   * (the column the output header below labels "part" -- presumably the input
   * files share that layout; verify against whatever produces them). The first
   * row seen for a key wins; later rows with the same key are ignored.
   *
   * Progress and errors are echoed as HTML.
   */

  $dirXmlBase = "xml/";
  $filelist = [];
  $log = "";                    // not used below; kept so the script's globals are unchanged
  $arrAllPaliWordsCount = [];   // key => first CSV row seen for that key
  $g_paliWordCounter = 0;       // number of data rows read across all input files

  // The enclosure and escape arguments are passed explicitly to every CSV call
  // below: relying on the default escape character is deprecated since PHP 8.4.
  // The values given are the historical defaults, so parsing is unchanged.

  /* Read the list of entries. */
  if (($handle = fopen("filelist.csv", 'r')) !== false) {
      // Read into a temporary first so that the terminating FALSE returned by
      // fgetcsv() is never stored as a bogus trailing entry.
      while (($row = fgetcsv($handle, 0, ',', '"', '\\')) !== false) {
          $filelist[] = $row;
      }
      fclose($handle);
  } else {
      echo "open file:filelist.csv false<br>";
  }
  $fileNums = count($filelist);

  /* Collect the first row for every distinct key from each entry's *_un.csv. */
  foreach ($filelist as $i => $row) {
      // Blank lines and rows without a name column cannot identify a file.
      if (!isset($row[1]) || $row[1] === '') {
          continue;
      }

      $outputFileNameHead = $row[1];
      $dirXml = $outputFileNameHead . "/";
      $inputFileName = $dirXmlBase . $dirXml . $outputFileNameHead . "_un.csv";
      echo "doing:[$i] - " . htmlspecialchars($outputFileNameHead, ENT_QUOTES, 'UTF-8') . " <br />";

      if (($handle = fopen($inputFileName, 'r')) === false) {
          echo "open file:" . htmlspecialchars($inputFileName, ENT_QUOTES, 'UTF-8') . " false<br>";
          continue; // nothing was opened, so there is nothing to close
      }

      $iLineNum = 0;
      while (($data = fgetcsv($handle, 0, ',', '"', '\\')) !== false) {
          $isHeaderLine = ($iLineNum === 0);
          $iLineNum++;
          if ($isHeaderLine) {
              continue; /* skip first line */
          }

          $g_paliWordCounter++;

          // Short or blank rows have no column 7 to build a key from.
          if (!isset($data[7])) {
              continue;
          }

          // str_getcsv() yields [null] for an empty field; the cast keeps the
          // array key a string ('') in that case.
          $parts = str_getcsv($data[7], '+', '"', '\\');
          $pali = (string) $parts[0];

          if (!isset($arrAllPaliWordsCount[$pali])) {
              $arrAllPaliWordsCount[$pali] = $data;
          }
      }
      // Closed only on the success path: fclose(false) raises a TypeError on PHP 8.
      fclose($handle);
  }

  /* Write the union table. */
  $outputfile = $dirXmlBase . "all_union.csv";
  $outputfileHtml = htmlspecialchars($outputfile, ENT_QUOTES, 'UTF-8');
  echo "outputfile:" . $outputfileHtml . "<br>";

  if (($fp = fopen($outputfile, "w")) !== false) {
      $wordCountCsvHead = [
          "id", "word", "type", "gramma", "parent", "mean", "note",
          "part", "partmean", "cf", "state", "delete", "tag", "len",
      ];
      fputcsv($fp, $wordCountCsvHead, ',', '"', '\\');
      foreach ($arrAllPaliWordsCount as $x_value) {
          fputcsv($fp, $x_value, ',', '"', '\\');
      }
      fclose($fp);
      // $outputfile already ends in ".csv"; report the real path.
      echo "union 导出到:" . $outputfileHtml . "<br>";
  } else {
      // Name the file that actually failed to open.
      echo "can not open csv file. filename=" . $outputfileHtml . "<br>";
  }
  echo "all done!";
  ?>
  </body>
  </html>