diff options
-rw-r--r-- | src/Curl.php | 48 | ||||
-rw-r--r-- | src/Etym.php | 3 |
2 files changed, 50 insertions, 1 deletions
diff --git a/src/Curl.php b/src/Curl.php new file mode 100644 index 0000000..61acaa0 --- /dev/null +++ b/src/Curl.php @@ -0,0 +1,48 @@ +<?php + +namespace App; + +use PHPHtmlParser\Exceptions\CurlException; +use PHPHtmlParser\CurlInterface; + +/** + * Class Curl + * + * @package PHPHtmlParser + */ +class Curl implements CurlInterface +{ + + /** + * A simple curl implementation to get the content of the url. + * + * @param string $url + * @return string + * @throws CurlException + */ + public function get(string $url): string + { + $ch = curl_init($url); + + if (! ini_get('open_basedir')) { + curl_setopt($ch, CURLOPT_FOLLOWLOCATION, true); + } + + curl_setopt($ch, CURLOPT_RETURNTRANSFER, true); + curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 5); + curl_setopt($ch, CURLOPT_SSL_VERIFYPEER, false); + // curl_setopt($ch, CURLOPT_VERBOSE, true); + curl_setopt($ch, CURLOPT_RETURNTRANSFER, true); + curl_setopt($ch, CURLOPT_USERAGENT, 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/52.0.2743.116 Safari/537.36'); + curl_setopt($ch, CURLOPT_URL, $url); + + $content = curl_exec($ch); + if ($content === false) { + // there was a problem + $error = curl_error($ch); + throw new CurlException('Error retrieving "'.$url.'" ('.$error.')'); + } + + return $content; + } +} diff --git a/src/Etym.php b/src/Etym.php index 1098021..10e22d7 100644 --- a/src/Etym.php +++ b/src/Etym.php @@ -2,6 +2,7 @@ namespace App; +use App\Curl; use PHPHtmlParser\Dom; /** @@ -43,7 +44,7 @@ class Etym $targetURL = $this->baseURL . $input; $dom = new Dom; - $dom->load($targetURL); + $dom->loadFromUrl($targetURL, [], new Curl); $html = $dom->find($this->domSearch); if (!$html instanceof \PHPHtmlParser\Dom\Collection || count($html) <= 0) { |