aboutsummaryrefslogtreecommitdiff
path: root/exampleData
diff options
context:
space:
mode:
authorGravatar Rogan Creswick <creswick@gmail.com>2013-06-16 22:08:45 -0700
committerGravatar Rogan Creswick <creswick@gmail.com>2013-06-16 22:08:45 -0700
commit10fcc55c46753f1c1f3e2b5a2659263d7b64578e (patch)
tree48fd64f6ebfa064de431fc99480252c3a5e88f42 /exampleData
parentb5604498ce494199268290433960858266e67b10 (diff)
removed debugging statements from upGoerFive rule, caught some exceptions in HeadlessAtom
Diffstat (limited to 'exampleData')
-rw-r--r--exampleData/ruleSets/language-processing/natural/upGoerFive.js39
1 files changed, 17 insertions, 22 deletions
diff --git a/exampleData/ruleSets/language-processing/natural/upGoerFive.js b/exampleData/ruleSets/language-processing/natural/upGoerFive.js
index fb17a54..092a181 100644
--- a/exampleData/ruleSets/language-processing/natural/upGoerFive.js
+++ b/exampleData/ruleSets/language-processing/natural/upGoerFive.js
@@ -1,6 +1,6 @@
var natural = require('natural');
-rule = {};
+rule = {};
rule.name = "Common words";
rule.description = "Identifies rare word use (words not in the 1000 most common English word list).";
@@ -144,25 +144,25 @@ var stemmer = natural.PorterStemmer;
var tokenizer = new natural.TreebankWordTokenizer();
var getTextNodesIn = function (node, includeWhitespaceNodes) {
- var textNodes = [], whitespace = /^\s*$/;
+ var textNodes = [], whitespace = /^\s*$/;
- function getTextNodes(node) {
- if ($(node).attr('id') == 'fiveui-top') {
- return;
- }
- if (node.nodeType == 3) {
- if (includeWhitespaceNodes || !whitespace.test(node.nodeValue)) {
- textNodes.push(node);
- }
- } else {
- for (var i = 0, len = node.childNodes.length; i < len; ++i) {
- getTextNodes(node.childNodes[i]);
- }
- }
+ function getTextNodes(node) {
+ if ($(node).attr('id') == 'fiveui-top') {
+ return;
}
+ if (node.nodeType == 3) {
+ if (includeWhitespaceNodes || !whitespace.test(node.nodeValue)) {
+ textNodes.push(node);
+ }
+ } else {
+ for (var i = 0, len = node.childNodes.length; i < len; ++i) {
+ getTextNodes(node.childNodes[i]);
+ }
+ }
+ }
- getTextNodes(node);
- return textNodes;
+ getTextNodes(node);
+ return textNodes;
};
var isCommonWord = function(word) {
@@ -173,11 +173,9 @@ var isPunctuation = function(str) {
return _.contains(['&', '%', '(', ')', ';', ':', '.', ',', '"', "'", '`', '!', '?' ], str);
};
-
var markWords = function(obj, report) {
var toks = tokenizer.tokenize($(obj).text());
var rawObj = $('<p></p>', {id: 'text'});
-// $(obj).empty();
$(obj).replaceWith(rawObj);
_.each(toks, function(tok) {
@@ -192,14 +190,11 @@ var markWords = function(obj, report) {
};
rule.rule = function(report) {
- console.log("checking for rare words");
fiveui.query('body').each(
function(i){
var nodes = getTextNodesIn(this);
_.map(nodes, function(n){
- console.log(n);
markWords(n, report);
});
});
- console.log("done checking for rare words");
}; \ No newline at end of file