轉自:http://blog.csdn.net/think2me/article/details/12999907
1. 說說csv 和 Excel
這兩者都是我們平時導出或者導入數據一般用到的載體。兩者有什么區別呢?csv 格式更兼容一點。那么共同點都是GBK格式的,非UTF8。所以我們上傳文件的時候,老是出現亂碼,就是編碼問題沒有轉好導致。
2. 推薦的幾種方法
1. 函數 fgetss($handel); 返回字符串。它就是strip_tags(fget($handel))的組合讀取csv 文件的一行。去掉了其中的HTML,php 等標簽。這種方法使用於小的csv 文件
- $handle=fopen("1.csv","r");
- while(!feof($handle)){
- $buffer=fgetss($handle,2048);
- $row = mb_convert_encoding(trim($buffer), 'utf-8', 'gbk'); //很重要。轉換成UTF8格式,不然容易產生亂碼
- $data=explode(",",$row); //轉換成數組
- $insertRows[] = $data;
- } //這樣所有的csv文件就生成一個二維數組$insertRows;
2. 函數 fgetcsv($handel,2048,','),返回數組,它就是explode(",",fget($handel))的組合。這種方法使用於小的csv 文件。而且不適合有漢字的csv 文件。
- $handle=fopen("1.csv","r");
- while($data=fgetcsv($handle,1000,",")){
- $insertRows[] = $data;
- } //這樣所有的csv文件就生成一個二維數組$insertRows;
- $handle=fopen("1.csv","r");
- //將文件一次性全部讀出來
- $excelData = array();
- $content = trim(file_get_contents($fileName));
- $excelData = explode("\n",$content);
或者直接用$excelData = file($file); file() 函數直接將數據讀出並放入數組當中。
我們先將所有的文件一次性讀出來。放到一個數組$excelData 中。這個時候,我們就可以不用管這個csv 文件了,純粹了php 操作數組了。所以。不會崩潰異常:
- $chunkData = array_chunk($excelData , 5000); // 將這個10W+ 的數組分割成5000一個的小數組。這樣就一次批量插入5000條數據。mysql 是支持的。
- $count = count($chunkData);
- for ($i = 0; $i < $count; $i++) {
- $insertRows = array();
- foreach($chunkData[$i] as $value){
- $string = mb_convert_encoding(trim(strip_tags($value)), 'utf-8', 'gbk');//轉碼
- $v = explode(',', trim($string));
- $row = array();
- $row['cdate'] = empty($v[0]) ? date('Y-m-d') : date('Y-m-d',strtotime($v[0]));
- $row['business'] = $v[1];
- $row['project'] = $v[2];
- $row['shopname'] = $v[3];
- $row['shopid'] = $v[4];
- $row['fanli'] = formatNumber($v[5]);
- $row['fb'] = $v[6] * 100;
- $row['jifen'] = $v[7];
- $sqlString = '('."'".implode( "','", $row ) . "'".')'; //批量
- $insertRows[] = $sqlString;
- }
- $result = $model->addDetail($insertRows); //批量將sql插入數據庫。
- }
插入數據庫當然是批量插入了:
- public function addDetail($rows){
- if(empty($rows)){
- return false;
- }
- //數據量較大,采取批量插入
- $data = implode(',', $rows);
- $sql = "INSERT IGNORE INTO tb_account_detail(cdate,business,project,shopname,shopid,fanli,fb,jifen)
- VALUES {$data}";
- $result = $this->query($sql);
- return true;
- }
ok ! 親測試。10W 數據。6個字段。插入需要10秒。
-----------------2013-12-18 日更新---------------------
3. 導出10W+的數據到csv
放棄之前寫的一篇博客中用到的方法:http://blog.csdn.net/think2me/article/details/8596833 。原因是:當超過50W+ 以上的數據時,有可能瀏覽器崩潰,內存超。
這個方法是寫文件的方式。然后再把文件彈出下載。
- public function dump2Excel() {
- set_time_limit(0);
- ini_set('memory_limit', '640M');
- //獲取列表
- $name = $this->getActionName();
- $model = D(GROUP_NAME . '.' . $name);
- $map = $this->_search();
- //文件名
- if (isset($_GET['error']) && $_GET['error'] > 0) {
- $filename = C('IMG_PATH').'account_data_error_' . $map['action_id'] . '_' . date('Y-m-d', mktime()) . '.csv';
- }else{
- $filename = C('IMG_PATH').'account_data_all_' . $map['action_id'] . '_' . date('Y-m-d', mktime()) . '.csv';
- }
- //用戶信息,商家ID,聯盟,商家訂單號,商品分類,確認類別,下單時間,完成時間,
- //實際支付金額,佣金,佣金補貼,返利,F幣,論壇積分,備注,強制入庫
- // 'user_info', 'shopid', 'league', 'order_id', 'classify', 'confirm_type',
- //'buydate', 'paydate', 'real_pay', 'commission', 'commission_plus',
- // 'fanli', 'jifen', 'bbs', 'remarks', 'persist_execute', 'unique_sign','error_code'
- $header[] = iconv("utf-8", "gb2312", "用戶信息");
- $header[] = iconv("utf-8", "gb2312", "商家ID");
- $header[] = iconv("utf-8", "gb2312", "聯盟");
- $header[] = iconv("utf-8", "gb2312", "商家訂單號");
- $header[] = iconv("utf-8", "gb2312", "商品分類");
- $header[] = iconv("utf-8", "gb2312", "確認類別");
- $header[] = iconv("utf-8", "gb2312", "下單時間");
- $header[] = iconv("utf-8", "gb2312", "完成時間");
- $header[] = iconv("utf-8", "gb2312", "實際支付金額");
- $header[] = iconv("utf-8", "gb2312", "佣金");
- $header[] = iconv("utf-8", "gb2312", "佣金補貼");
- $header[] = iconv("utf-8", "gb2312", "返利");
- $header[] = iconv("utf-8", "gb2312", "F幣");
- $header[] = iconv("utf-8", "gb2312", "論壇積分");
- $header[] = iconv("utf-8", "gb2312", "備注");
- $header[] = iconv("utf-8", "gb2312", "強制入庫");
- $header[] = iconv("utf-8", "gb2312", "唯一標識");
- $header[] = iconv("utf-8", "gb2312", "錯誤信息");
- $headerFile = implode(',', $header);
- //寫入標題
- @unlink($filename);
- file_put_contents($filename, $headerFile."\n");
- //獲取所有error_code
- $list = D('Fanli')->table('tb_account_action_data_error_code')->field('id,err_msg')->findAll();
- $error_msg = array();
- foreach ($list as $value) {
- $error_msg[$value['id']] = $value['err_msg'];
- }
- //導入錯誤的數據
- if (isset($_GET['error']) && $_GET['error'] > 0) {
- $map['error_code'] = array('gt', 0);
- }
- if (!empty($map['action_id'])) {
- $allCount = $model->where($map)->field('count(1) as count')->select();
- $pageLimit = ceil($allCount[0]['count']/self::PAGE_COUNT);
- $voList = array();
- //打開文件
- if (!$handle = fopen($filename, 'a')) {
- echo "不能打開文件 $filename";
- exit;
- }
- //分頁獲取
- for($i=0;$i<$pageLimit;$i++){
- $count = self::PAGE_COUNT;
- $start = $count * $i;
- $limit = "$start,$count";
- $voList = $model->where($map)->limit($limit)->order('id desc')->findAll();
- //寫入文件
- $excelString = array();
- foreach ($voList as $v) {
- $dumpExcel = array();
- $dumpExcel[] = mb_convert_encoding($v['user_info'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['shopid'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['league'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['order_id'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['classify'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['confirm_type'], 'GBK', 'UTF-8');
- $dumpExcel[] = "'".mb_convert_encoding($v['buydate'], 'GBK', 'UTF-8');
- $dumpExcel[] = "'".mb_convert_encoding($v['paydate'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['real_pay'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['commission'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['commission_plus'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['fanli'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['jifen'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['bbs'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($v['remarks'], 'GBK', 'UTF-8');
- $dumpExcel[] = intval($v['persist_execute']);
- $dumpExcel[] = mb_convert_encoding($v['unique_sign'], 'GBK', 'UTF-8');
- $dumpExcel[] = mb_convert_encoding($error_msg[$v['error_code']], 'GBK', 'UTF-8');
- $excelString[] = implode(',',$dumpExcel);
- }
- //只能一行行些。不然容易漏
- foreach($excelString as $content){
- fwrite($handle, $content . "\n");
- }
- unset($excelString);
- }
- fclose($handle);
- }
- //導出下載
- header("Content-type: application/octet-stream");
- header('Content-Disposition: attachment; filename="' . basename($filename) . '"');
- header("Content-Length: ". filesize($filename));
- readfile($filename);
- }
