diff options
author | alecpl <alec@alec.pl> | 2010-05-18 10:25:29 +0000 |
---|---|---|
committer | alecpl <alec@alec.pl> | 2010-05-18 10:25:29 +0000 |
commit | 677e1f26fe47cc0c3e0819cb99a9024af49a619c (patch) | |
tree | 91074d603179889ba7fbde9d080c85ed62b27846 /program/steps/utils/spell_pspell.inc | |
parent | caccd193c8403913d7c77d65363ff6e4d4269dfb (diff) |
- Some files from /bin + spellchecking actions moved to the new 'utils' task
Diffstat (limited to 'program/steps/utils/spell_pspell.inc')
-rw-r--r-- | program/steps/utils/spell_pspell.inc | 78 |
1 files changed, 78 insertions, 0 deletions
diff --git a/program/steps/utils/spell_pspell.inc b/program/steps/utils/spell_pspell.inc new file mode 100644 index 000000000..f892f8963 --- /dev/null +++ b/program/steps/utils/spell_pspell.inc @@ -0,0 +1,78 @@ +<?php + +/* + +-----------------------------------------------------------------------+ + | program/steps/utils/spell_pspell.inc | + | | + | This file is part of the RoundCube Webmail client | + | Licensed under the GNU GPL | + | | + | PURPOSE: | + | Use the Pspell extension to check spelling, returns results | + | compatible with spell_googie.inc. | + | | + +-----------------------------------------------------------------------+ + | Author: Kris Steinhoff <steinhof@umich.edu> | + +-----------------------------------------------------------------------+ + + $Id$ + +*/ + +if (!extension_loaded('pspell')) { + raise_error(array( + 'code' => 500, + 'type' => 'php', + 'file' => __FILE__, 'line' => __LINE__, + 'message' => "Pspell extension not available"), true, false); + + header('HTTP/1.1 404 Not Found'); + exit; +} + +// max. number of suggestions for one word +define('MAX_SUGGESTIONS', 10); + +// read input +$data = file_get_contents('php://input'); + +// parse data (simplexml_load_string breaks CRLFs) +$left = strpos($data, '<text>'); +$right = strrpos($data, '</text>'); +$text = substr($data, $left+6, $right-($left+6)); +$text = html_entity_decode($text, ENT_QUOTES, RCMAIL_CHARSET); + +// tokenize +$words = preg_split('/[ !"#$%&()*+\\,\/\n:;<=>?@\[\]^_{|}-]+|\.[^\w]/', $text, NULL, PREG_SPLIT_NO_EMPTY | PREG_SPLIT_OFFSET_CAPTURE ); + +// init spellchecker +$plink = pspell_new(get_input_value('lang', RCUBE_INPUT_GET), null, null, RCMAIL_CHARSET, PSPELL_FAST); + +// send output +$out = '<?xml version="1.0" encoding="'.RCMAIL_CHARSET.'"?><spellresult charschecked="'.mb_strlen($text).'">'; + +$diff = 0; +foreach ($words as $w) { + $word = trim($w[0]); + $pos = $w[1] - $diff; + $len = mb_strlen($word); + if ($word && $plink && preg_match('/[^0-9\.]/', $word) + && !pspell_check($plink, $word)) { + $suggestions = pspell_suggest($plink, $word); + if (sizeof($suggestions)>10) + $suggestions = array_slice($suggestions, 0, MAX_SUGGESTIONS); + + $out .= '<c o="'.$pos.'" l="'.$len.'">'; + $out .= implode("\t", $suggestions); + $out .= '</c>'; + } + $diff += (strlen($word) - $len); +} + +$out .= '</spellresult>'; + +header("Content-Type: text/xml; charset=".RCMAIL_CHARSET); +echo $out; +exit; + +?> |