-
Notifications
You must be signed in to change notification settings - Fork 7
/
CurlClient.php
128 lines (109 loc) · 3.08 KB
/
CurlClient.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
<?php
namespace Simgroep\ConcurrentSpiderBundle;
use VDB\Uri\Uri;
/**
 * Thin cURL wrapper that sends a body-less OPTIONS request to a URI and
 * decides, from the reported Content-Type, whether the target is a document
 * (PDF, Word, RTF, OpenDocument text or a generic binary stream).
 */
class CurlClient
{
    /**
     * Active cURL handle. It is null until initClient() has run and is reset
     * to null again once isDocument() has closed it.
     *
     * @var resource|null
     */
    protected $ch;

    /**
     * Value sent through CURLOPT_USERAGENT.
     *
     * @var string
     */
    protected $userAgent;

    /**
     * Directory handed to CURLOPT_CAPATH; an empty value leaves cURL's SSL defaults untouched.
     *
     * @var string
     */
    protected $curlCertCADirectory;

    /**
     * @param string $userAgent           Value sent through CURLOPT_USERAGENT.
     * @param string $curlCertCADirectory Directory passed to CURLOPT_CAPATH (may be empty).
     */
    public function __construct($userAgent, $curlCertCADirectory)
    {
        $this->userAgent = $userAgent;
        $this->curlCertCADirectory = $curlCertCADirectory;
    }

    /**
     * Creates a fresh cURL handle and applies the default request options.
     *
     * Calling this explicitly is optional: isDocument() creates a handle on
     * demand when none is available.
     *
     * @throws \RuntimeException When the cURL handle cannot be created.
     */
    public function initClient()
    {
        $handle = curl_init();
        if (false === $handle) {
            throw new \RuntimeException('Unable to initialise a cURL handle');
        }

        $this->ch = $handle;
        $this->setDefaultOptions($this->userAgent, $this->curlCertCADirectory);
    }

    /**
     * Configures the current handle for a body-less OPTIONS request.
     *
     * @param string $userAgent           Value sent through CURLOPT_USERAGENT.
     * @param string $curlCertCADirectory Directory passed to CURLOPT_CAPATH; when empty,
     *                                    no SSL option is set here.
     */
    protected function setDefaultOptions($userAgent, $curlCertCADirectory)
    {
        // Only response metadata (status, content type, redirect URL) is read
        // afterwards via curl_getinfo(), so neither headers nor body are requested.
        curl_setopt($this->ch, CURLOPT_HEADER, 0);
        curl_setopt($this->ch, CURLOPT_RETURNTRANSFER, 0);
        curl_setopt($this->ch, CURLOPT_NOBODY, true);
        curl_setopt($this->ch, CURLOPT_CUSTOMREQUEST, 'OPTIONS');
        curl_setopt($this->ch, CURLOPT_USERAGENT, $userAgent);

        if (!empty($curlCertCADirectory)) {
            curl_setopt($this->ch, CURLOPT_SSL_VERIFYPEER, true);
            curl_setopt($this->ch, CURLOPT_CAPATH, $curlCertCADirectory);
        }
    }

    /**
     * Requests the URI and reports whether its Content-Type is one of the
     * recognised document media types.
     *
     * The handle is closed after every call, whether it returns or throws.
     *
     * @param Uri $uri Target to probe.
     *
     * @return bool True when the reported media type is a recognised document type.
     *
     * @throws \Exception When the server answers with HTTP 301; the message
     *                    carries the redirect target reported by cURL.
     */
    public function isDocument(Uri $uri)
    {
        // The previous call closed its handle, so create one on demand instead
        // of operating on a dead handle.
        if (null === $this->ch) {
            $this->initClient();
        }

        curl_setopt($this->ch, CURLOPT_URL, $uri->toString());
        curl_exec($this->ch);

        if (301 === (int) $this->getStatusCode()) {
            // Read the redirect target before the handle goes away.
            $redirectUrl = $this->getRedirectUrl();
            $this->closeHandle();

            throw new \Exception(sprintf(
                'Page moved to %s',
                $redirectUrl
            ));
        }

        $contentType = $this->getContentType();
        $this->closeHandle();

        return $this->checkConntentType($contentType);
    }

    /**
     * @return mixed HTTP status code reported by cURL for the last transfer.
     */
    protected function getStatusCode()
    {
        return curl_getinfo($this->ch, CURLINFO_HTTP_CODE);
    }

    /**
     * @return mixed Content-Type reported by cURL for the last transfer.
     */
    protected function getContentType()
    {
        return curl_getinfo($this->ch, CURLINFO_CONTENT_TYPE);
    }

    /**
     * @return mixed Redirect URL reported by cURL for the last transfer.
     */
    protected function getRedirectUrl()
    {
        return curl_getinfo($this->ch, CURLINFO_REDIRECT_URL);
    }

    /**
     * Tells whether a Content-Type header value denotes a recognised document type.
     *
     * Parameters after the first ';' (for example a charset) are ignored, and
     * the media type itself is compared case-insensitively with surrounding
     * whitespace removed.
     *
     * @param mixed $contentType Raw Content-Type value; non-string or empty
     *                           values are treated as "not a document".
     *
     * @return bool
     */
    protected function checkConntentType($contentType)
    {
        // A missing Content-Type arrives here as a non-string value.
        if (!is_string($contentType) || '' === $contentType) {
            return false;
        }

        $segments = explode(';', $contentType);
        $mediaType = strtolower(trim($segments[0]));

        switch ($mediaType) {
            case 'application/pdf':
            case 'application/octet-stream':
            case 'application/msword':
            case 'application/vnd.openxmlformats-officedocument.wordprocessingml.document':
            case 'application/vnd.openxmlformats-officedocument.wordprocessingml.template':
            case 'application/rtf':
            case 'application/vnd.oasis.opendocument.text':
                return true;
        }

        return false;
    }

    /**
     * Closes the current handle, if any, and clears the reference so the next
     * request starts from a fresh handle.
     */
    private function closeHandle()
    {
        if (null !== $this->ch) {
            curl_close($this->ch);
            $this->ch = null;
        }
    }
}