summaryrefslogtreecommitdiff
path: root/etym.php
blob: 08059fd3f191256bb9bd09a6a680c64eac480ad1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
<?php

use PHPHtmlParser\Dom;

$baseURL = "http://www.etymonline.com/word/";
$htmlNode = "section[class^='word__defination']";
$pasteCmd = "pastebinit -b http://p.of.je 2>/dev/null";

function readStdin()
{
    $input = fgets(STDIN);

    if ($input === false) {
        echo "No input supplied!\n";
        exit(1);
    }

    $input = rtrim($input, "\n");

    return $input;
}

function cleanUpHtml($input)
{
    // Strip HTML Tags
    $clear = strip_tags($input);
    // Clean up things like &amp;
    $clear = html_entity_decode($clear);
    // Strip out any url-encoded stuff
    $clear = urldecode($clear);
    // Replace Multiple spaces with single space
    $clear = preg_replace('/ +/', ' ', $clear);
    // Trim the string of leading/trailing space
    $clear = trim($clear);
    // Capitalise the first char.
    $clear = ucfirst($clear);

    return $clear;
}

function handleTruncation($input, $definition, $url)
{
    $truncated = $definition;

    $MAX_CHARACTERS = 350;
    if (strlen($truncated) >= $MAX_CHARACTERS) {
        // Create that povjee link.
        // Capitalise the first char of the input.
        $input    = ucfirst($input);
        $defAndUrl        = "\"$input\"" . "\n\n" . $definition . "\n\n" . "[Original at: $url]";
        $safeDef        = escapeshellarg($defAndUrl);

        $pasteBinCmd     = "echo $safeDef | " . $pasteCmd;
        $pasteBinLink    = exec($pasteBinCmd);

        $truncated = substr($truncated, 0, $MAX_CHARACTERS) . "... [More info at $pasteBinLink]";
    }

    return $truncated;
}

function getDefinition()
{

    $input = readStdin();

    $targetURL = $baseURL . $input;

    $dom = new Dom;
    $dom->load($targetURL);
    $html = $dom->find($htmlNode)[0]->innerHtml();
    $node = $html->find($htmlNode, 0);

    if ($node === null) {
        echo "No entry found for '$input'!\n";
        exit(2);
    }

    $definition = cleanUpHtml($node->innertext);
    $definition = handleTruncation($input, $definition, $targetURL);

    echo $definition . "\n";
}

getDefinition();