Last active
March 16, 2017 12:22
-
-
Save arandomic/b2b3103d2bb8cb0239da5478a5e69bd0 to your computer and use it in GitHub Desktop.
Count the words and symbols in a sentence on the page.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
/*
 * Counts how often each word and each punctuation/whitespace run occurs in the
 * lower-cased text of the page element with id "sentence", then logs both
 * tallies to the console as JSON.
 *
 * Top-level names are declared with `var` on purpose: they stay ordinary,
 * re-declarable globals, so the snippet can be pasted into a console repeatedly.
 */

// Naive normalization of word forms to their base (dictionary) form.
var word_replacer = {
  'букв': 'буква', 'скобок': 'скобка', 'буквы': 'буква', 'пробелов': 'пробел',
  'восклицательных': 'восклицательный', 'одна': 'один', 'две': 'два', 'знаков': 'знак',
  'точки': 'точка', 'скобки': 'скобка', 'точек': 'точка', 'слова': 'слово',
  'тысячи': 'тысяча', 'латинских': 'латинская', 'правых': 'правая', 'слов': 'слово',
  'знака': 'знак', 'кавычек': 'кавычка', 'пробела': 'пробел', 'левых': 'левая',
  'тысяч': 'тысяча', 'кавычки': 'кавычка', 'запятых': 'запятая', 'одно': 'один'
};

// A word is a maximal run of characters other than the listed punctuation,
// the space and the newline.
var word_pattern = /([^\",.)(;!? \n]+)/g;

// A symbol token is a maximal run of the listed punctuation/space characters,
// so adjacent ones (e.g. ", ") are tallied together under a single key.
// NOTE(review): drop the `+` if every character should be counted separately.
var symbol_pattern = /([\",.)(;!? ]+)/g;

/**
 * Returns every match of `pattern` in `text`.
 *
 * @param {string} text - Text to scan.
 * @param {RegExp} pattern - Global (`/g`) regular expression.
 * @returns {string[]} The matched substrings; an empty array when none match.
 */
function extract_tokens(text, pattern) {
  // String.prototype.match returns null (not []) when nothing matches.
  return text.match(pattern) || [];
}

/**
 * Maps a word to its base form using `word_replacer`.
 *
 * @param {string} word - Lower-cased word.
 * @returns {string} The replacement if one is listed, otherwise `word` itself.
 */
function normalize_word(word) {
  // Own-property check: a plain `in` would also match inherited keys such as
  // "constructor" and replace the word with a function.
  return Object.prototype.hasOwnProperty.call(word_replacer, word)
    ? word_replacer[word]
    : word;
}

/**
 * Tallies how many times each token occurs.
 *
 * @param {string[]} tokens - Tokens to count.
 * @param {function(string): string} [normalize] - Optional mapping applied to
 *   each token before it is counted.
 * @returns {Object<string, number>} Token -> count, in first-seen order.
 */
function count_tokens(tokens, normalize) {
  // Null-prototype object: tokens like "constructor" or "__proto__" are then
  // stored as ordinary keys instead of colliding with Object.prototype.
  const counts = Object.create(null);
  for (const token of tokens) {
    const key = normalize ? normalize(token) : token;
    counts[key] = (counts[key] || 0) + 1;
  }
  return counts;
}

// getElementById expects the bare id, not a "#id" selector. The literal
// "#sentence" id is still tried as a fallback in case a page really uses it.
var sentence_element = typeof document !== 'undefined'
  ? document.getElementById('sentence') || document.getElementById('#sentence')
  : null;
if (!sentence_element) {
  console.warn('Element with id "sentence" not found; counting an empty sentence.');
}

// textContent yields the visible text; innerHTML would return markup with
// entity escapes (e.g. "&amp;"), which would be miscounted as words/symbols.
var sentence = sentence_element ? sentence_element.textContent.toLowerCase() : '';

var words = extract_tokens(sentence, word_pattern);
var symbols = extract_tokens(sentence, symbol_pattern);

var words_counter = count_tokens(words, normalize_word);
var symbol_counter = count_tokens(symbols);

console.log(JSON.stringify(words_counter));
console.log(JSON.stringify(symbol_counter));
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment