国产探花免费观看_亚洲丰满少妇自慰呻吟_97日韩有码在线_资源在线日韩欧美_一区二区精品毛片,辰东完美世界有声小说,欢乐颂第一季,yy玄幻小说排行榜完本

首頁 > 編程 > PHP > 正文

PHP制作百度詞典查詞采集器

2020-03-22 19:28:02
字體:
來源:轉載
供稿:網友
百度dict 采集樣本寫的采集百度dict詞典翻譯后的所有結果數據,當然附帶了13.5w單詞庫和采集簡單的案例,這里我把寫出的主要類dict.class.php放出來,項目地址http://github.com/widuu/baidu_dict,有需要的直接fork就可以了~么么噠,這東西用的人很少,所以有用的兄弟拿走了哈~ * dict.class.php 采集百度詞典翻譯內容 * @copyright (C) 2014 widuu * @license http://www.widuu.com * @lastmodify 2014-2-15
/**
 * Fetch the Baidu dictionary result page for the current word.
 *
 * Issues an HTTP GET to dict.baidu.com with a desktop Firefox user agent,
 * follows redirects, and gives up after 30 seconds.
 *
 * @return string|bool The response body, or false when the cURL transfer fails.
 */
private function getContent(){
    $useragent = "Mozilla/5.0 (Windows NT 6.1; WOW64; rv:23.0) Gecko/20100101 Firefox/23.0";
    $ch = curl_init();
    // NOTE(review): the word is appended unencoded; confirm callers never pass
    // phrases containing spaces or other characters that need URL encoding.
    $url = "http://dict.baidu.com/s?wd=".$this->word;
    curl_setopt($ch, CURLOPT_URL, $url);
    curl_setopt($ch, CURLOPT_USERAGENT, $useragent);
    // Return the body from curl_exec() instead of printing it.
    curl_setopt($ch, CURLOPT_RETURNTRANSFER, TRUE);
    curl_setopt($ch, CURLOPT_FOLLOWLOCATION, 1);
    curl_setopt($ch, CURLOPT_HTTPGET, 1);
    curl_setopt($ch, CURLOPT_AUTOREFERER, 1);
    // Exclude response headers so callers can regex the HTML directly.
    curl_setopt($ch, CURLOPT_HEADER, 0);
    curl_setopt($ch, CURLOPT_TIMEOUT, 30);
    $result = curl_exec($ch);
    // Check the handle the request actually ran on. The original queried an
    // undefined $curl variable, so transfer errors were never reported.
    if (curl_errno($ch)) {
        echo 'Errno'.curl_error($ch);
    }
    curl_close($ch);
    return $result;
}
$data = $this - getContent(); preg_match_all("http://"EN/-US/"/ (.*)/ //b/ /Ui",$data,$pronounced); return array( 'en' = $pronounced[1][0], 'us' = $pronounced[1][1] * 獲取百度翻譯發音 * return array(英,美) private function getSay(){ $data = $this - getContent(); preg_match_all("/url=/"(.*)/"/Ui",$data,$pronounced); return array( 'en' = $pronounced[1][0], 'us' = $pronounced[1][1] * 獲取百度翻譯例句 * return array() 多維數組 例句 private function getExample(){ $str = ""; $data = $this - getContent(); preg_match_all("/var example_data = (.*)/]/;/Us",$data,$example); $data1 = "[[[".ltrim($example[1][0],"["); $data2 = explode("[[[",$data1); $num = count(array_filter($data2)); foreach($data2 as $key = $value){ $data3 = explode("[[","[[".$value); foreach ($data3 as $k = $v) { preg_match_all("http://[/"(.*)/",/Us","[".$v, $match); if(!empty($match[1])){ $str .= implode($match[1]," ")."@"; $data4 = trim($str,"@"); $data5 = explode("@", $data4); $result = array_chunk($data5, 2); return $result; * 獲取簡明釋義 * return array (x = "詞性",b = "附屬") private function getExplain(){ $data = $this - getContent(); preg_match_all("/id/=/"en/-simple/-means/"/ (.*)/ div(/s+)class/=/"source/"/ /Us",$data,$explain); $r_data = $explain[1][0]; preg_match_all("http:// p/ / strong/ ( P adj .*)/ //strong/ / span/ ( P name .*)/ //span/ / //p/ /Us", $r_data, $a_data); preg_match_all("http:// span/ ( P tag [^/ ]+)/:/ a(/s+)href/=/"(.*)/"/ ( P word .*)/ //a/ / //span/ /Us", $r_data, $b_data); $result = array(); foreach ($a_data["adj"] as $key = $value) { $result[$value] = $a_data["name"][$key]; $word_b = array(); foreach ($b_data["tag"] as $key = $value) { $word_b[$value] = strip_tags($b_data["word"][$key]); $result_data = array("x" = $result,"b" = $word_b); return $result_data;
$data = $this - getContent(); preg_match_all("/id=/"en/-syn/-ant/"/ (.*) div(/s+)class/=/"source/" /Us",$data,$synonym); $content = $synonym[1][0]; $data1 = explode(" /dl ", $content); $result = array(); $data2 = array(); foreach ($data1 as $key = $value) { preg_match_all("http:// strong/ ( P adj .*)/ / //strong/ / //div/ / div(/s+)class/=/"syn/-ant/-list/"/ / ul/ ( content .*)/ //ul/ /Us", $value, $r_data); $data2[$key]["adj"] = $r_data["adj"]; $data2[$key]["content"] = $r_data["content"]; foreach ($data2 as $key = $value) { foreach ($value["content"] as $k = $v) { if(!empty($v)){ preg_match_all("http:// li/ / p/ ( P title .*)/ //p/ ( P value .*)/ //li /Us", $v, $v_data); foreach ($v_data['title'] as $m = $d) { $data = strip_tags(preg_replace(" /a "," ", $v_data["value"][$m])); $result[$key][$value["adj"][$k]][$d] = $data; return $result; * 獲取短語詞組 * return array (key = value) 一維或者多維數組 private function getPhrase(){ $num = self::$num; $data = $this - getContent(); preg_match_all("/id=/"en/-phrase/"/ (.*)/ div class/=/"source/"/ /Us",$data,$phrase); $data = explode(" /dd ",$phrase[1][0]); $data1 = array_slice($data,0,$num); $result = array(); foreach ($data1 as $key = $value) { $data2 = explode(" /p ", $value); $n = count($data2); if($n =3){ $result[str_replace("","",strip_tags($data2[0]))] = strip_tags($data2[1]); }else{ $data3 = array_slice($data2,0,$n-1); $data4 = array_slice($data2,0,2); $res = array_diff($data3,$data4); $data5 = array_chunk($res,2); $key_value = trim(str_replace("","",strip_tags($data4[0]))); $result[$key_value] = strip_tags($data4[1]); foreach ($data5 as $key = $value) { foreach ($value as $k = $v) { $value[$k] = strip_tags($v); $array = array($result[$key_value],$value); if (array_key_exists($key_value, $result)){ $result[$key_value] = $array; return $result; * 將數組轉換為字符串 * @param array $data 數組 * @param bool $isformdata 如果為0,則不使用new_stripslashes處理,可選參數,默認為1 * @return string 返回字符串,如果,data為空,則返回空 private function array2string($data, $isformdata 
= 1) { if($data == '') return ''; if($isformdata) $data = $this- new_stripslashes($data); return addslashes(var_export($data, TRUE)); * 返回經stripslashes處理過的字符串或數組 * @param $string 需要處理的字符串或數組 * @return mixed private function new_stripslashes($string) { if(!is_array($string)) return stripslashes($string); foreach($string as $key = $val) $string[$key] = $this- new_stripslashes($val); return $string;// $word = new dict("express");// $word - content();以上就是本文的全部內容了,非常實用的功能,希望小伙伴們能夠喜歡。PHP教程

鄭重聲明:本文版權歸原作者所有,轉載文章僅為傳播更多信息之目的,如作者信息標記有誤,請第一時間聯系我們修改或刪除,多謝。

發表評論 共有條評論
用戶名: 密碼:
驗證碼: 匿名發表
主站蜘蛛池模板: 饶河县| 醴陵市| 秦皇岛市| 行唐县| 金溪县| 应用必备| 东方市| 宁都县| 宜昌市| 临沧市| 关岭| 华安县| 溧阳市| 连江县| 天水市| 湟源县| 昆明市| 平原县| 丹巴县| 沿河| 大英县| 扶沟县| 新丰县| 贡山| 郴州市| 临沂市| 达日县| 合江县| 焦作市| 大冶市| 旬阳县| 泽普县| 中山市| 云梦县| 静乐县| 资阳市| 富平县| 云林县| 延边| 岑巩县| 安塞县|