forked from marshallbrekka/WebBot
-
Notifications
You must be signed in to change notification settings - Fork 0
/
DocumentLoader.php
59 lines (43 loc) · 1011 Bytes
/
DocumentLoader.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
<?php
/**
 * DocumentLoader
 *
 * Holds a list of URLs, downloads each one with cURL and hands the
 * downloaded pages out one at a time through getNext().
 *
 * @author Marshall
 */
class DocumentLoader {
    /** @var array URLs supplied by the most recent addUrls() call. */
    private $urls = array();

    /** @var array Downloaded pages, each stored as array($url, $data). */
    private $pages = array();

    /** @var int Index into $pages of the entry the next getNext() call returns. */
    private $internalPointer = 0;

    /** @var mixed Not read or written by any method of this class. */
    private $directory;

    /** @var bool Whether $pages has been built from the current $urls. */
    private $loaded = false;

    /**
     * Sets the list of URLs to download.
     *
     * Despite the name, the given list replaces any previously supplied
     * URLs rather than being appended to them; this class has always
     * cleared its list before merging, and that behaviour is kept.
     * Nothing is downloaded here: the fetch happens on the next
     * getNext() call.
     *
     * @param array $urls URLs to download.
     * @return void
     */
    public function addUrls($urls) {
        $this->urls = array_merge(array(), $urls);

        // Pages fetched for the previous list no longer match $urls, so
        // drop them and restart iteration from the beginning.
        $this->pages = array();
        $this->internalPointer = 0;
        $this->loaded = false;
    }

    /**
     * Returns the next downloaded page and advances the internal pointer.
     *
     * The first call after addUrls() (or on a fresh instance) downloads
     * every queued URL before returning.
     *
     * @return array|false array($url, $data) for the next page, or false
     *                     once every page has been returned.
     */
    public function getNext() {
        if (!$this->loaded) {
            $this->loadUrls();
        }

        if ($this->internalPointer < count($this->pages)) {
            return $this->pages[$this->internalPointer++];
        }

        return false;
    }

    /**
     * Downloads every queued URL and rebuilds $pages from the results.
     *
     * URLs whose download fails are skipped, so $pages may hold fewer
     * entries than $urls.
     *
     * @return void
     */
    private function loadUrls() {
        $this->pages = array();
        foreach ($this->urls as $url) {
            $data = $this->loadWebPage($url);
            // Compare against false explicitly: a successful download can
            // legitimately be an empty string or "0", which are falsy.
            if ($data !== false) {
                $this->pages[] = array($url, $data);
            }
        }
        $this->loaded = true;
    }

    /**
     * Fetches a single URL with cURL.
     *
     * @param string $url Address to fetch.
     * @return string|false The response body, or false when the handle
     *                      could not be created or the transfer failed
     *                      (CURLOPT_FAILONERROR makes HTTP status codes
     *                      >= 400 count as failures).
     */
    private function loadWebPage($url) {
        $timeout = 5; // seconds allowed for establishing the connection

        $curlObject = curl_init();
        if ($curlObject === false) {
            return false;
        }

        curl_setopt($curlObject, CURLOPT_URL, $url);
        // Without this option curl_exec() prints the body to output and
        // returns true instead of handing the body back to the caller.
        curl_setopt($curlObject, CURLOPT_RETURNTRANSFER, true);
        curl_setopt($curlObject, CURLOPT_FAILONERROR, true);
        curl_setopt($curlObject, CURLOPT_CONNECTTIMEOUT, $timeout);

        $data = curl_exec($curlObject);
        curl_close($curlObject);

        return $data;
    }
}
?>