From 9cd0234665ea66dff172d94b9c1b4cb61b1d25b1 Mon Sep 17 00:00:00 2001 From: Fbenas Date: Sun, 21 Jun 2020 17:58:23 +0100 Subject: Improve robustness of all scripts and add more to sync command --- app/Console/Commands/ScrapeUrl.php | 40 ++------------------------------------ 1 file changed, 2 insertions(+), 38 deletions(-) (limited to 'app/Console/Commands/ScrapeUrl.php') diff --git a/app/Console/Commands/ScrapeUrl.php b/app/Console/Commands/ScrapeUrl.php index c02080e..06091bf 100644 --- a/app/Console/Commands/ScrapeUrl.php +++ b/app/Console/Commands/ScrapeUrl.php @@ -7,55 +7,19 @@ use Goutte\Client; class ScrapeUrl extends Command { - /** - * The name and signature of the console command. - * - * @var string - */ protected $signature = 'scrape:url { url }'; - - /** - * The console command description. - * - * @var string - */ protected $description = 'Scrape a webpage for data'; - protected $client; - - /** - * Create a new command instance. - * - * @return void - */ - public function __construct() - { - parent::__construct(); - $this->client = new Client(); - } - - /** - * Execute the console command. - * - * @return mixed - */ public function handle() { $url = $this->argument('url'); - if ($url != 'https://www.sixnationsrugby.com/fixtures/') { - $this->error('Url not supported'); - return; - } - - $crawler = $this->client->request('GET', $this->argument('url')); + $crawler = (new Client())->request('GET', $this->argument('url')); - $crawler->filter('div.fixtures__top-tier')->each( + $crawler->filter('title')->each( function ($node) { print $node->text()."\n"; } ); - - } } -- cgit v1.2.3