diff options
author | friendica <info@friendica.com> | 2012-01-31 15:54:41 -0800 |
---|---|---|
committer | friendica <info@friendica.com> | 2012-01-31 15:54:41 -0800 |
commit | c8c062d96024a23e67e73f1ebffcf7009b18eed1 (patch) | |
tree | ec8382bc177f4f8be6516ab8d2e420088d6f9733 /library/spam/example | |
parent | 4fc455d195fef9f1bfbc9f125788650fb3153237 (diff) | |
download | volse-hubzilla-c8c062d96024a23e67e73f1ebffcf7009b18eed1.tar.gz volse-hubzilla-c8c062d96024a23e67e73f1ebffcf7009b18eed1.tar.bz2 volse-hubzilla-c8c062d96024a23e67e73f1ebffcf7009b18eed1.zip |
add spam engine
Diffstat (limited to 'library/spam/example')
-rw-r--r-- | library/spam/example/index.php | 241 |
1 files changed, 241 insertions, 0 deletions
diff --git a/library/spam/example/index.php b/library/spam/example/index.php new file mode 100644 index 000000000..6d3c14260 --- /dev/null +++ b/library/spam/example/index.php @@ -0,0 +1,241 @@ +<?php + +# Copyright (C) 2006-2010 Tobias Leupold <tobias.leupold@web.de> +# +# This file is part of the b8 package +# +# This program is free software; you can redistribute it and/or modify it +# under the terms of the GNU Lesser General Public License as published by +# the Free Software Foundation in version 2.1 of the License. +# +# This program is distributed in the hope that it will be useful, but +# WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY +# or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public +# License for more details. +# +# You should have received a copy of the GNU Lesser General Public License +# along with this program; if not, write to the Free Software Foundation, +# Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307, USA. + + +### This is an example script demonstrating how b8 can be used. ### + +#/* + +# Use this code block if you want to use Berkeley DB. + +# The database filename is interpreted relative to the b8.php script location. + +$config_b8 = array( + 'storage' => 'dba' +); + +$config_database = array( + 'database' => 'wordlist.db', + 'handler' => 'db4' +); + +#*/ + +/* + +# Use this code block if you want to use MySQL. + +# An existing link resource can be passed to b8 by setting +# $config_database['connection'] to this link resource. +# Be sure to set your database access data otherwise! + +$config_b8 = array( + 'storage' => 'mysql' +); + +$config_database = array( + 'database' => 'test', + 'table_name' => 'b8_wordlist', + 'host' => 'localhost', + 'user' => '', + 'pass' => '' +); + +*/ + +# To be able to calculate the time the classification took + +$time_start = NULL; + +function microtimeFloat() +{ + list($usec, $sec) = explode(" ", microtime()); + return ((float) $usec + (float) $sec); +} + +# Output a nicely colored rating + +function formatRating($rating) +{ + + if($rating === FALSE) + return "<span style=\"color:red\">could not calculate spaminess</span>"; + + $red = floor(255 * $rating); + $green = floor(255 * (1 - $rating)); + + return "<span style=\"color:rgb($red, $green, 0);\"><b>" . sprintf("%5f", $rating) . "</b></span>"; + +} + +echo <<<END +<?xml version="1.0" encoding="UTF-8"?> + +<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" + "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd"> + +<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en"> + +<head> + +<title>example b8 interface</title> + +<meta http-equiv="content-type" content="text/html; charset=UTF-8" /> + +<meta name="dc.creator" content="Tobias Leupold" /> +<meta name="dc.rights" content="Copyright (c) by Tobias Leupold" /> + +</head> + +<body> + +<div> + +<h1>example b8 interface</h1> + + +END; + +$postedText = ""; + +if(isset($_POST['action']) and $_POST['text'] == "") + echo "<p style=\"color:red;\"><b>Please type in a text!</b></p>\n\n"; + +elseif(isset($_POST['action']) and $_POST['text'] != "") { + + $time_start = microtimeFloat(); + + # Include the b8 code + require dirname(__FILE__) . "/../b8/b8.php"; + + # Create a new b8 instance + $b8 = new b8($config_b8, $config_database); + + # Check if everything worked smoothly + + $started_up = $b8->validate(); + + if($started_up !== TRUE) { + echo "<b>example:</b> Could not initialize b8. error code: $started_up"; + exit; + } + + $text = stripslashes($_POST['text']); + $postedText = htmlentities($text, ENT_QUOTES, 'UTF-8'); + + switch($_POST['action']) { + + case "Classify": + echo "<p><b>Spaminess: " . formatRating($b8->classify($text)) . "</b></p>\n"; + break; + + case "Save as Spam": + + $ratingBefore = $b8->classify($text); + $b8->learn($text, b8::SPAM); + $ratingAfter = $b8->classify($text); + + echo "<p>Saved the text as Spam</p>\n\n"; + + echo "<div><table>\n"; + echo "<tr><td>Classification before learning:</td><td>" . formatRating($ratingBefore) . "</td></tr>\n"; + echo "<tr><td>Classification after learning:</td><td>" . formatRating($ratingAfter) . "</td></tr>\n"; + echo "</table></div>\n\n"; + + break; + + case "Save as Ham": + + $ratingBefore = $b8->classify($text); + $b8->learn($text, b8::HAM); + $ratingAfter = $b8->classify($text); + + echo "<p>Saved the text as Ham</p>\n\n"; + + echo "<div><table>\n"; + echo "<tr><td>Classification before learning:</td><td>" . formatRating($ratingBefore) . "</td></tr>\n"; + echo "<tr><td>Classification after learning:</td><td>" . formatRating($ratingAfter) . "</td></tr>\n"; + echo "</table></div>\n\n"; + + break; + + case "Delete from Spam": + $b8->unlearn($text, b8::SPAM); + echo "<p style=\"color:green\">Deleted the text from Spam</p>\n\n"; + break; + + case "Delete from Ham": + $b8->unlearn($text, b8::HAM); + echo "<p style=\"color:green\">Deleted the text from Ham</p>\n\n"; + break; + + } + + $mem_used = round(memory_get_usage() / 1048576, 5); + $peak_mem_used = round(memory_get_peak_usage() / 1048576, 5); + $time_taken = round(microtimeFloat() - $time_start, 5); + +} + +echo <<<END +<div> +<form action="{$_SERVER['PHP_SELF']}" method="post"> +<div> +<textarea name="text" cols="50" rows="16">$postedText</textarea> +</div> +<table> +<tr> +<td><input type="submit" name="action" value="Classify" /></td> +</tr> +<tr> +<td><input type="submit" name="action" value="Save as Spam" /></td> +<td><input type="submit" name="action" value="Save as Ham" /></td> +</tr> +<tr> +<td><input type="submit" name="action" value="Delete from Spam" /></td> +<td><input type="submit" name="action" value="Delete from Ham" /></td> +</tr> +</table> +</form> +</div> + +</div> + +END; + +if($time_start !== NULL) { + +echo <<<END +<div> +<table border="0"> +<tr><td>Memory used: </td><td>$mem_used MB</td></tr> +<tr><td>Peak memory used:</td><td>$peak_mem_used MB</td></tr> +<tr><td>Time taken: </td><td>$time_taken sec</td></tr> +</table> +</div> + +END; + +} + +?> + +</body> + +</html> |