[44] | 1 | <?php
|
---|
| 2 | /**
|
---|
| 3 | * $Id: editor_plugin_src.js 201 2007-02-12 15:56:56Z spocke $
|
---|
| 4 | *
|
---|
| 5 | * @package MCManager.includes
|
---|
| 6 | * @author Moxiecode
|
---|
| 7 | * @copyright Copyright © 2004-2007, Moxiecode Systems AB, All rights reserved.
|
---|
| 8 | */
|
---|
| 9 |
|
---|
| 10 | class GoogleSpell extends SpellChecker {
|
---|
| 11 | /**
|
---|
| 12 | * Spellchecks an array of words.
|
---|
| 13 | *
|
---|
| 14 | * @param {String} $lang Language code like sv or en.
|
---|
| 15 | * @param {Array} $words Array of words to spellcheck.
|
---|
| 16 | * @return {Array} Array of misspelled words.
|
---|
| 17 | */
|
---|
| 18 | function &checkWords($lang, $words) {
|
---|
| 19 | $wordstr = implode(' ', $words);
|
---|
| 20 | $matches = $this->_getMatches($lang, $wordstr);
|
---|
| 21 | $words = array();
|
---|
| 22 |
|
---|
| 23 | for ($i=0; $i<count($matches); $i++)
|
---|
| 24 | $words[] = $this->_unhtmlentities(mb_substr($wordstr, $matches[$i][1], $matches[$i][2], "UTF-8"));
|
---|
| 25 |
|
---|
| 26 | return $words;
|
---|
| 27 | }
|
---|
| 28 |
|
---|
| 29 | /**
|
---|
| 30 | * Returns suggestions of for a specific word.
|
---|
| 31 | *
|
---|
| 32 | * @param {String} $lang Language code like sv or en.
|
---|
| 33 | * @param {String} $word Specific word to get suggestions for.
|
---|
| 34 | * @return {Array} Array of suggestions for the specified word.
|
---|
| 35 | */
|
---|
| 36 | function &getSuggestions($lang, $word) {
|
---|
| 37 | $sug = array();
|
---|
| 38 | $osug = array();
|
---|
| 39 | $matches = $this->_getMatches($lang, $word);
|
---|
| 40 |
|
---|
| 41 | if (count($matches) > 0)
|
---|
| 42 | $sug = explode("\t", utf8_encode($this->_unhtmlentities($matches[0][4])));
|
---|
| 43 |
|
---|
| 44 | // Remove empty
|
---|
| 45 | foreach ($sug as $item) {
|
---|
| 46 | if ($item)
|
---|
| 47 | $osug[] = $item;
|
---|
| 48 | }
|
---|
| 49 |
|
---|
| 50 | return $osug;
|
---|
| 51 | }
|
---|
| 52 |
|
---|
| 53 | function &_getMatches($lang, $str) {
|
---|
| 54 | $server = "www.google.com";
|
---|
| 55 | $port = 443;
|
---|
| 56 | $path = "/tbproxy/spell?lang=" . $lang . "&hl=en";
|
---|
| 57 | $host = "www.google.com";
|
---|
| 58 | $url = "https://" . $server;
|
---|
| 59 |
|
---|
| 60 | // Setup XML request
|
---|
| 61 | $xml = '<?xml version="1.0" encoding="utf-8" ?><spellrequest textalreadyclipped="0" ignoredups="0" ignoredigits="1" ignoreallcaps="1"><text>' . $str . '</text></spellrequest>';
|
---|
| 62 |
|
---|
| 63 | $header = "POST ".$path." HTTP/1.0 \r\n";
|
---|
| 64 | $header .= "MIME-Version: 1.0 \r\n";
|
---|
| 65 | $header .= "Content-type: application/PTI26 \r\n";
|
---|
| 66 | $header .= "Content-length: ".strlen($xml)." \r\n";
|
---|
| 67 | $header .= "Content-transfer-encoding: text \r\n";
|
---|
| 68 | $header .= "Request-number: 1 \r\n";
|
---|
| 69 | $header .= "Document-type: Request \r\n";
|
---|
| 70 | $header .= "Interface-Version: Test 1.4 \r\n";
|
---|
| 71 | $header .= "Connection: close \r\n\r\n";
|
---|
| 72 | $header .= $xml;
|
---|
| 73 |
|
---|
| 74 | // Use curl if it exists
|
---|
| 75 | if (function_exists('curl_init')) {
|
---|
| 76 | // Use curl
|
---|
| 77 | $ch = curl_init();
|
---|
| 78 | curl_setopt($ch, CURLOPT_URL,$url);
|
---|
| 79 | curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
|
---|
| 80 | curl_setopt($ch, CURLOPT_CUSTOMREQUEST, $header);
|
---|
| 81 | curl_setopt($ch, CURLOPT_SSL_VERIFYPEER, FALSE);
|
---|
| 82 | $xml = curl_exec($ch);
|
---|
| 83 | curl_close($ch);
|
---|
| 84 | } else {
|
---|
| 85 | // Use raw sockets
|
---|
| 86 | $fp = fsockopen("ssl://" . $server, $port, $errno, $errstr, 30);
|
---|
| 87 | if ($fp) {
|
---|
| 88 | // Send request
|
---|
| 89 | fwrite($fp, $header);
|
---|
| 90 |
|
---|
| 91 | // Read response
|
---|
| 92 | $xml = "";
|
---|
| 93 | while (!feof($fp))
|
---|
| 94 | $xml .= fgets($fp, 128);
|
---|
| 95 |
|
---|
| 96 | fclose($fp);
|
---|
| 97 | } else
|
---|
| 98 | echo "Could not open SSL connection to google.";
|
---|
| 99 | }
|
---|
| 100 |
|
---|
| 101 | // Grab and parse content
|
---|
| 102 | $matches = array();
|
---|
| 103 | preg_match_all('/<c o="([^"]*)" l="([^"]*)" s="([^"]*)">([^<]*)<\/c>/', $xml, $matches, PREG_SET_ORDER);
|
---|
| 104 |
|
---|
| 105 | return $matches;
|
---|
| 106 | }
|
---|
| 107 |
|
---|
| 108 | function _unhtmlentities($string) {
|
---|
| 109 | $string = preg_replace('~&#x([0-9a-f]+);~ei', 'chr(hexdec("\\1"))', $string);
|
---|
| 110 | $string = preg_replace('~&#([0-9]+);~e', 'chr(\\1)', $string);
|
---|
| 111 |
|
---|
| 112 | $trans_tbl = get_html_translation_table(HTML_ENTITIES);
|
---|
| 113 | $trans_tbl = array_flip($trans_tbl);
|
---|
| 114 |
|
---|
| 115 | return strtr($string, $trans_tbl);
|
---|
| 116 | }
|
---|
| 117 | }
|
---|
| 118 |
|
---|
| 119 | // Patch in multibyte support
|
---|
| 120 | if (!function_exists('mb_substr')) {
|
---|
| 121 | function mb_substr($str, $start, $len = '', $encoding="UTF-8"){
|
---|
| 122 | $limit = strlen($str);
|
---|
| 123 |
|
---|
| 124 | for ($s = 0; $start > 0;--$start) {// found the real start
|
---|
| 125 | if ($s >= $limit)
|
---|
| 126 | break;
|
---|
| 127 |
|
---|
| 128 | if ($str[$s] <= "\x7F")
|
---|
| 129 | ++$s;
|
---|
| 130 | else {
|
---|
| 131 | ++$s; // skip length
|
---|
| 132 |
|
---|
| 133 | while ($str[$s] >= "\x80" && $str[$s] <= "\xBF")
|
---|
| 134 | ++$s;
|
---|
| 135 | }
|
---|
| 136 | }
|
---|
| 137 |
|
---|
| 138 | if ($len == '')
|
---|
| 139 | return substr($str, $s);
|
---|
| 140 | else
|
---|
| 141 | for ($e = $s; $len > 0; --$len) {//found the real end
|
---|
| 142 | if ($e >= $limit)
|
---|
| 143 | break;
|
---|
| 144 |
|
---|
| 145 | if ($str[$e] <= "\x7F")
|
---|
| 146 | ++$e;
|
---|
| 147 | else {
|
---|
| 148 | ++$e;//skip length
|
---|
| 149 |
|
---|
| 150 | while ($str[$e] >= "\x80" && $str[$e] <= "\xBF" && $e < $limit)
|
---|
| 151 | ++$e;
|
---|
| 152 | }
|
---|
| 153 | }
|
---|
| 154 |
|
---|
| 155 | return substr($str, $s, $e - $s);
|
---|
| 156 | }
|
---|
| 157 | }
|
---|
| 158 |
|
---|
| 159 | ?> |
---|