Example #1
0
 /**
  * Mendownload $size buah link sekaligus, lalu diproses oleh fungsi $function
  * @param integer $size jumlah thread yg diinginkan
  * @param array   $pages_url array of full url
  * @param string  $function nama fungsi yang dipanggil untuk memproses 1 halaman,
  *                  fungsinya minimal punya 1 parameter (Page $P)
  * @param array   $params parameter tambahan ke fungsi
  */
 public static function multiProcess($size, $pages_url, $function, $params = false)
 {
     $n = 0;
     $curlHandle = null;
     $curlList = array();
     foreach ($pages_url as $aurl) {
         if ($n == 0) {
             $curlHandle = curl_multi_init();
         }
         $curlList[$aurl] = self::addHandle($curlHandle, $aurl);
         $n++;
         if ($n >= $size) {
             self::execHandle($curlHandle);
             foreach ($curlList as $theurl => $curlEl) {
                 $html = curl_multi_getcontent($curlEl);
                 // Ada kemungkinan gagal retrieve
                 if (trim($html)) {
                     $P = new Page();
                     $P->fetch_text($html);
                 } else {
                     $P = new Page($theurl);
                 }
                 if ($params) {
                     call_user_func_array($function, array_merge(array($P), $params));
                 } else {
                     $function($P);
                 }
                 curl_multi_remove_handle($curlHandle, $curlEl);
             }
             curl_multi_close($curlHandle);
             $n = 0;
             $curlList = array();
         }
     }
     if ($curlList) {
         self::execHandle($curlHandle);
         foreach ($curlList as $theurl => $curlEl) {
             $html = curl_multi_getcontent($curlEl);
             // Ada kemungkinan gagal retrieve
             if (trim($html)) {
                 $P = new Page();
                 $P->fetch_text($html);
             } else {
                 $P = new Page($theurl);
             }
             if ($params) {
                 call_user_func_array($function, array_merge(array($P), $params));
             } else {
                 $function($P);
             }
             curl_multi_remove_handle($curlHandle, $curlEl);
         }
         curl_multi_close($curlHandle);
     }
 }
Example #2
0
function coursera()
{
    $p = new Page();
    $p->fetch_text(file_get_contents('D:\\temp\\Design and Analysis of Algorithms I\\coursera.dump.htm'));
    $p->go_line('class="item_list"');
    do {
        if ($p->curr_line()->contain('<li')) {
            $title = $p->next_line()->to_s();
        } else {
            if ($p->curr_line()->contain('download.mp4')) {
                $href = $p->curr_line()->dup()->cut_between('href="', '"')->to_s();
                echo "<a href='{$href}'>{$title}</a><br />\n";
            }
        }
    } while (!$p->next_line()->contain('<script>'));
}