summaryrefslogtreecommitdiff
path: root/program/steps/utils/spell_pspell.inc
diff options
context:
space:
mode:
authoralecpl <alec@alec.pl>2010-05-18 10:25:29 +0000
committeralecpl <alec@alec.pl>2010-05-18 10:25:29 +0000
commit677e1f26fe47cc0c3e0819cb99a9024af49a619c (patch)
tree91074d603179889ba7fbde9d080c85ed62b27846 /program/steps/utils/spell_pspell.inc
parentcaccd193c8403913d7c77d65363ff6e4d4269dfb (diff)
- Some files from /bin + spellchecking actions moved to the new 'utils' task
Diffstat (limited to 'program/steps/utils/spell_pspell.inc')
-rw-r--r--program/steps/utils/spell_pspell.inc78
1 files changed, 78 insertions, 0 deletions
diff --git a/program/steps/utils/spell_pspell.inc b/program/steps/utils/spell_pspell.inc
new file mode 100644
index 000000000..f892f8963
--- /dev/null
+++ b/program/steps/utils/spell_pspell.inc
@@ -0,0 +1,78 @@
+<?php
+
+/*
+ +-----------------------------------------------------------------------+
+ | program/steps/utils/spell_pspell.inc |
+ | |
+ | This file is part of the RoundCube Webmail client |
+ | Licensed under the GNU GPL |
+ | |
+ | PURPOSE: |
+ | Use the Pspell extension to check spelling, returns results |
+ | compatible with spell_googie.inc. |
+ | |
+ +-----------------------------------------------------------------------+
+ | Author: Kris Steinhoff <steinhof@umich.edu> |
+ +-----------------------------------------------------------------------+
+
+ $Id$
+
+*/
+
+if (!extension_loaded('pspell')) {
+ raise_error(array(
+ 'code' => 500,
+ 'type' => 'php',
+ 'file' => __FILE__, 'line' => __LINE__,
+ 'message' => "Pspell extension not available"), true, false);
+
+ header('HTTP/1.1 404 Not Found');
+ exit;
+}
+
+// max. number of suggestions for one word
+define('MAX_SUGGESTIONS', 10);
+
+// read input
+$data = file_get_contents('php://input');
+
+// parse data (simplexml_load_string breaks CRLFs)
+$left = strpos($data, '<text>');
+$right = strrpos($data, '</text>');
+$text = substr($data, $left+6, $right-($left+6));
+$text = html_entity_decode($text, ENT_QUOTES, RCMAIL_CHARSET);
+
+// tokenize
+$words = preg_split('/[ !"#$%&()*+\\,\/\n:;<=>?@\[\]^_{|}-]+|\.[^\w]/', $text, NULL, PREG_SPLIT_NO_EMPTY | PREG_SPLIT_OFFSET_CAPTURE );
+
+// init spellchecker
+$plink = pspell_new(get_input_value('lang', RCUBE_INPUT_GET), null, null, RCMAIL_CHARSET, PSPELL_FAST);
+
+// send output
+$out = '<?xml version="1.0" encoding="'.RCMAIL_CHARSET.'"?><spellresult charschecked="'.mb_strlen($text).'">';
+
+$diff = 0;
+foreach ($words as $w) {
+ $word = trim($w[0]);
+ $pos = $w[1] - $diff;
+ $len = mb_strlen($word);
+ if ($word && $plink && preg_match('/[^0-9\.]/', $word)
+ && !pspell_check($plink, $word)) {
+ $suggestions = pspell_suggest($plink, $word);
+ if (sizeof($suggestions)>10)
+ $suggestions = array_slice($suggestions, 0, MAX_SUGGESTIONS);
+
+ $out .= '<c o="'.$pos.'" l="'.$len.'">';
+ $out .= implode("\t", $suggestions);
+ $out .= '</c>';
+ }
+ $diff += (strlen($word) - $len);
+}
+
+$out .= '</spellresult>';
+
+header("Content-Type: text/xml; charset=".RCMAIL_CHARSET);
+echo $out;
+exit;
+
+?>