Home > Article > Backend Development > PHP curl batch processing realizes controllable concurrent and asynchronous operations
This article mainly introduces the controllable concurrency and asynchronous operation of php curl batch processing. It has certain reference value. Now I share it with you. Friends in need can refer to it.
The examples in this article are described PHP curl batch processing implements controllable concurrent asynchronous operations. Share it with everyone for your reference, the details are as follows:
Usually cURL in PHP runs in a blocking manner, which means that after creating a cURL request, you must wait for it to execute successfully or time out before executing the next request: API CURL is generally preferred for interface access. In actual projects or in the process of writing your own gadgets (such as news aggregation, commodity price monitoring, price comparison), you usually need to obtain data from a third-party website or API interface. When processing a URL queue, in order to improve performance, you can use the
curl_multi_* family of functions provided by cURL to achieve simple concurrency. <pre class="brush:php;toolbar:false"><?php
include &#39;curl.class.php&#39;;
function callback($response, $info, $error, $request)
{
echo &#39;response:<br>&#39;;
print_r($response);
echo &#39;<br>&#39; . date("Y-m-d H:i:s") . &#39; <br>&#39;;
echo &#39;<br>&#39; . str_repeat("-", 100) . &#39;<br>&#39;;
}
$USER_COOKIE = (!empty($_REQUEST[&#39;cookie&#39;])) ? $_REQUEST[&#39;cookie&#39;] : file_get_contents("cookie.txt");
$curl = new Curl ("callback");
$data = array(
array(
&#39;url&#39; => &#39;http://dyactive2.vip.xunlei.com/com_sign/?game=qmr&type=rec_gametime&referfrom=&rt=0.42521539455332336&#39;, //秦美人
&#39;method&#39; => &#39;POST&#39;,
&#39;post_data&#39; => &#39;&#39;,
&#39;header&#39; => null,
&#39;options&#39; => array(
CURLOPT_REFERER => "http://niu.xunlei.com/entergame/?gameNo=qmr&fenQuNum=3",
CURLOPT_COOKIE => $USER_COOKIE,
)
),
array(
&#39;url&#39; => &#39;http://dyactive2.vip.xunlei.com/com_sign/?game=sq&type=rec_gametime&referfrom=&rt=0.42521539455332336&#39;, //神曲
&#39;method&#39; => &#39;POST&#39;,
&#39;post_data&#39; => &#39;&#39;,
&#39;header&#39; => null,
&#39;options&#39; => array(
CURLOPT_REFERER => "http://niu.xunlei.com/entergame/?gameNo=sq&fenQuNum=41",
CURLOPT_COOKIE => $USER_COOKIE,
)
),
array(
&#39;url&#39; => &#39;http://dyactive2.vip.xunlei.com/com_sign/?game=frxz&type=rec_gametime&referfrom=&rt=0.42521539455332336&#39;, //凡人修真
&#39;method&#39; => &#39;POST&#39;,
&#39;post_data&#39; => &#39;&#39;,
&#39;header&#39; => null,
&#39;options&#39; => array(
CURLOPT_REFERER => "http://niu.xunlei.com/entergame/?gameNo=frxz&fenQuNum=3",
CURLOPT_COOKIE => $USER_COOKIE,
)
),
array(
&#39;url&#39; => &#39;http://dyactive2.vip.xunlei.com/com_sign/?game=smxj&type=rec_gametime&referfrom=&rt=0.42521539455332336&#39;, //神魔仙界
&#39;method&#39; => &#39;POST&#39;,
&#39;post_data&#39; => &#39;&#39;,
&#39;header&#39; => null,
&#39;options&#39; => array(
CURLOPT_REFERER => "http://niu.xunlei.com/entergame/?gameNo=smxj&fenQuNum=2",
CURLOPT_COOKIE => $USER_COOKIE,
)
),
array(
&#39;url&#39; => &#39;http://dyactive2.vip.xunlei.com/com_sign/?game=qsqy&type=rec_gametime&referfrom=&rt=0.42521539455332336&#39;, //倾世情缘
&#39;method&#39; => &#39;POST&#39;,
&#39;post_data&#39; => &#39;&#39;,
&#39;header&#39; => null,
&#39;options&#39; => array(
CURLOPT_REFERER => "http://niu.xunlei.com/entergame/?gameNo=qsqy&fenQuNum=11",
CURLOPT_COOKIE => $USER_COOKIE,
)
),
);
foreach ($data as $val) {
$request = new Curl_request ($val [&#39;url&#39;], $val [&#39;method&#39;], $val [&#39;post_data&#39;], $val [&#39;header&#39;], $val [&#39;options&#39;]);
$curl->add($request);
}
$curl->execute();
echo $curl->display_errors();</pre>
The effect is very good, there are no side effects, and the number of concurrency can be Control, there are many applications, use your imagination
<?php /** * cURL批量处理 工具类 * * @since Version 1.0 * @author Justmepzy <justmepzy@gmail.com> * @link http://t.qq.com/JustPzy */ /** *单一的请求对象 */ class Curl_request { public $url = ''; public $method = 'GET'; public $post_data = null; public $headers = null; public $options = null; /** * * @param string $url * @param string $method * @param string $post_data * @param string $headers * @param array $options * @return void */ public function __construct($url, $method = 'GET', $post_data = null, $headers = null, $options = null) { $this->url = $url; $this->method = strtoupper( $method ); $this->post_data = $post_data; $this->headers = $headers; $this->options = $options; } /** * @return void */ public function __destruct() { unset ( $this->url, $this->method, $this->post_data, $this->headers, $this->options ); } } /** * 包含请求列队处理 */ class Curl { /** * 请求url个数 * @var int */ private $size = 5; /** * 等待所有cURL批处理中的活动连接等待响应时间 * @var int */ private $timeout = 5; /** * 完成请求回调函数 * @var string */ private $callback = null; /** * cRUL配置 * @var array */ private $options = array (CURLOPT_SSL_VERIFYPEER => 0,CURLOPT_RETURNTRANSFER => 1,CURLOPT_CONNECTTIMEOUT => 30 ); /** * 请求头 * @var array */ private $headers = array (); /** * 请求列队 * @var array */ private $requests = array (); /** * 请求列队索引 * @var array */ private $request_map = array (); /** * 错误 * @var array */ private $errors = array (); /** * @access public * @param string $callback 回调函数 * 该函数有4个参数($response,$info,$error,$request) * $response url返回的body * $info cURL连接资源句柄的信息 * $error 错误 * $request 请求对象 */ public function __construct($callback = null) { $this->callback = $callback; } /** * 添加一个请求对象到列队 * @access public * @param object $request * @return boolean */ public function add($request) { $this->requests [] = $request; return TRUE; } /** * 创建一个请求对象并添加到列队 * @access public * @param string $url * @param string $method * @param string $post_data * @param string $headers * @param array $options * @return boolean */ public function request($url, $method = 'GET', $post_data = null, $headers = null, $options = null) { $this->requests [] = new Curl_request ( $url, $method, $post_data, $headers, $options ); return TRUE; } /** * 创建GET请求对象 * @access public * @param string $url * @param string $headers * @param array $options * @return boolean */ public function get($url, $headers = null, $options = null) { return $this->request ( $url, "GET", null, $headers, $options ); } /** * 创建一个POST请求对象 * @access public * @param string $url * @param string $post_data * @param string $headers * @param array $options * @return boolean */ public function post($url, $post_data = null, $headers = null, $options = null) { return $this->request ( $url, "POST", $post_data, $headers, $options ); } /** * 执行cURL * @access public * @param int $size 最大连接数 * @return Ambigous <boolean, mixed>|boolean */ public function execute($size = null) { if (sizeof ( $this->requests ) == 1) { return $this->single_curl (); } else { return $this->rolling_curl ( $size ); } } /** * 单个url请求 * @access private * @return mixed|boolean */ private function single_curl() { $ch = curl_init (); $request = array_shift ( $this->requests ); $options = $this->get_options ( $request ); curl_setopt_array ( $ch, $options ); $output = curl_exec ( $ch ); $info = curl_getinfo ( $ch ); // it's not neccesary to set a callback for one-off requests if ($this->callback) { $callback = $this->callback; if (is_callable ( $this->callback )) { call_user_func ( $callback, $output, $info, $request ); } } else return $output; return true; } /** * 多个url请求 * @access private * @param int $size 最大连接数 * @return boolean */ private function rolling_curl($size = null) { if ($size) $this->size = $size; else $this->size = count($this->requests); if (sizeof ( $this->requests ) < $this->size) $this->size = sizeof ( $this->requests ); if ($this->size < 2) $this->set_error ( 'size must be greater than 1' ); $master = curl_multi_init (); //添加cURL连接资源句柄到map索引 for($i = 0; $i < $this->size; $i ++) { $ch = curl_init (); $options = $this->get_options ( $this->requests [$i] ); curl_setopt_array ( $ch, $options ); curl_multi_add_handle ( $master, $ch ); $key = ( string ) $ch; $this->request_map [$key] = $i; } $active = $done = null; do { while ( ($execrun = curl_multi_exec ( $master, $active )) == CURLM_CALL_MULTI_PERFORM ) ; if ($execrun != CURLM_OK) break; //有一个请求完成则回调 while ( $done = curl_multi_info_read ( $master ) ) { //$done 完成的请求句柄 $info = curl_getinfo ( $done ['handle'] );// $output = curl_multi_getcontent ( $done ['handle'] );// $error = curl_error ( $done ['handle'] );// $this->set_error ( $error ); //调用回调函数,如果存在的话 $callback = $this->callback; if (is_callable ( $callback )) { $key = ( string ) $done ['handle']; $request = $this->requests [$this->request_map [$key]]; unset ( $this->request_map [$key] ); call_user_func ( $callback, $output, $info, $error, $request ); } curl_close ( $done ['handle'] ); //从列队中移除已经完成的request curl_multi_remove_handle ( $master, $done ['handle'] ); } //等待所有cURL批处理中的活动连接 if ($active) curl_multi_select ( $master, $this->timeout ); } while ( $active ); //完成关闭 curl_multi_close ( $master ); return true; } /** * 获取没得请求对象的cURL配置 * @access private * @param object $request * @return array */ private function get_options($request) { $options = $this->__get ( 'options' ); if (ini_get ( 'safe_mode' ) == 'Off' || ! ini_get ( 'safe_mode' )) { $options [CURLOPT_FOLLOWLOCATION] = 1; $options [CURLOPT_MAXREDIRS] = 5; } $headers = $this->__get ( 'headers' ); if ($request->options) { $options = $request->options + $options; } $options [CURLOPT_URL] = $request->url; if ($request->post_data && strtolower($request->method) == 'post' ) { $options [CURLOPT_POST] = 1; $options [CURLOPT_POSTFIELDS] = $request->post_data; } if ($headers) { $options [CURLOPT_HEADER] = 0; $options [CURLOPT_HTTPHEADER] = $headers; } return $options; } /** * 设置错误信息 * @access public * @param string $msg */ public function set_error($msg) { if (! empty ( $msg )) $this->errors [] = $msg; } /** * 获取错误信息 * @access public * @param string $open * @param string $close * @return string */ public function display_errors($open = '<p>', $close = '</p>') { $str = ''; foreach ( $this->errors as $val ) { $str .= $open . $val . $close; } return $str; } /** * @access public * @param string $name * @param string $value * @return boolean */ public function __set($name, $value) { if ($name == 'options' || $name == 'headers') { $this->{$name} = $value + $this->{$name}; } else { $this->{$name} = $value; } return TRUE; } /** * * @param string $name * @return mixed * @access public */ public function __get($name) { return (isset ( $this->{$name} )) ? $this->{$name} : null; } /** * @return void * @access public */ public function __destruct() { unset ( $this->size, $this->timeout, $this->callback, $this->options, $this->headers, $this->requests, $this->request_map, $this->errors ); } } // END Curl Class /* End of file curl.class.php */
The above is the entire content of this article, please pay attention to the PHP Chinese website for more related content.
Related recommendations:
php curl sends a fake requestphp CURL obtains cookies to simulate login method code exampleThe above is the detailed content of PHP curl batch processing realizes controllable concurrent and asynchronous operations. For more information, please follow other related articles on the PHP Chinese website!