javascript - Faster way to find an occurrence of 2-Dimensional array of keywords with frequency value - Stack Overflow

IT技术

更新时间：2025-04-060

admin管理员组
文章数量:1355031

Do I have a faster way to count all frequency of all elements in 2-Dimensional array? Like this sample:

var array = [["a", "b"]["c", "d"]["b", "d"]["c", "a", "b"], ["a", "b", "c", "d"];

My expected result would be an array of objects contain keyword and frequency value.
Like this,

result = [{ keyword: "a",
            frequency: 3
          }, {
            keyword: "b",
            frequency: 4
          }, ... ];

Here is my solution:

function generateData (records) {
  var data = [];
  for (var i = 0; i < records; ++i) {
      data.push(["a", "b", "c", "d", "e"]);
  }
  // some gap to insert data
  setTimeout(function () {
  }, Math.random() * 1000);
  return data;
}

function mine (data) {
  var result = [];
  data.forEach( function (keywords) {
      for (var i = 0, len = keywords.length; i < len; ++i) {
          var pos = result.map( function (x) {
              return x.keyword;
          }).indexOf(keywords[i]);

          if (pos == -1) {
              var newKeyword = {
                  keyword: keywords[i],
                  frequency: 1
              }
              result.push(newKeyword);
          } else { 
              result[pos].frequency += 1;
          }
      }
  });
  return result;
}

var dataset = generateData(50000);

var start = performance.now();
var result = mine(dataset);
var end = performance.now();

console.log(result);
console.log("Total time: " + (end - start) + " milliseconds.");

Do I have a faster way to count all frequency of all elements in 2-Dimensional array? Like this sample:

var array = [["a", "b"]["c", "d"]["b", "d"]["c", "a", "b"], ["a", "b", "c", "d"];

My expected result would be an array of objects contain keyword and frequency value.
Like this,

result = [{ keyword: "a",
            frequency: 3
          }, {
            keyword: "b",
            frequency: 4
          }, ... ];

Here is my solution:

function generateData (records) {
  var data = [];
  for (var i = 0; i < records; ++i) {
      data.push(["a", "b", "c", "d", "e"]);
  }
  // some gap to insert data
  setTimeout(function () {
  }, Math.random() * 1000);
  return data;
}

function mine (data) {
  var result = [];
  data.forEach( function (keywords) {
      for (var i = 0, len = keywords.length; i < len; ++i) {
          var pos = result.map( function (x) {
              return x.keyword;
          }).indexOf(keywords[i]);

          if (pos == -1) {
              var newKeyword = {
                  keyword: keywords[i],
                  frequency: 1
              }
              result.push(newKeyword);
          } else { 
              result[pos].frequency += 1;
          }
      }
  });
  return result;
}

var dataset = generateData(50000);

var start = performance.now();
var result = mine(dataset);
var end = performance.now();

console.log(result);
console.log("Total time: " + (end - start) + " milliseconds.");

Does anyone have a faster way to solve this problem? Note: With 2-Dimensional of keywords array (around ~50,000 records).

Share Improve this question edited Jan 18, 2019 at 6:45 asked Jan 18, 2019 at 6:00 Parn 9187 silver badges19 bronze badges

Add a ment |

5 Answers 5

Sorted by: Reset to default 5

You can use .reduce() to get the desired frequency in the form of an object:

let data = [
  ["a", "b"],
  ["c", "d"],
  ["b", "d"],
  ["c", "a", "b"],
  ["a", "b", "c", "d"]
];

let result = [].concat(...data).reduce((r, c) => (r[c] = (r[c] || 0) + 1, r), {});

console.log(result);

If this really is a bottleneck and squeezing speed out of the counting is worth code that's not quite as pretty as the functional solutions, you will have a hard time beating for loops in today's javascript engines. In my tests this is about twice as fast as using reduce():

var array = [["a", "b"],["c", "d"],["b", "d"],["c", "a", "b"], ["a", "b", "c", "d"]];

let counts = new Map()
for (let i = 0; i < array.length; i++){
    for (let j = 0; j < array[i].length; j++){
        let n = counts.get(array[i][j]) || 0
        counts.set(array[i][j], n + 1)
    }
}

JSperf Benchmark here

You could simplify it to something like this using flat and reduce:

const input = [["a", "b"],["c", "d"],["b", "d"],["c", "a", "b"],["a", "b", "c", "d"]]

,output = input.flat().reduce((acc, a) =>
  ((acc[a] = acc[a] || {keyword: a, frequency: 0})["frequency"]++, acc)
,{})

console.log(Object.values(output))

If flat isn't supported, use [].concat(...input).reduce()

You can reduce plexity by storing words in a map, then iterating on the map at the end. This saves iterating on the result for every word

Old plexity O(N * M * R) array * word in each group * result New plexity O(N*M + R)

Note: Array.prototype.concat, I believe, has a big runtime. For each concat, a new object is created and the existing and new values are copied into that new object and returned. That's why the old arrays are not modified. So values are read over and over.

var array = [["a", "b"],["c", "d"],["b", "d"],["c", "a", "b"], ["a", "b", "c", "d"]];
var resultMap = {};
array.forEach(function (keywords) {
    keywords.forEach(function(word, i){
    if(resultMap[word]) {
        resultMap[word].frequency = resultMap[word].frequency + 1;
    }
    else{
        resultMap[word] = {
        keyword: word,
        frequency: 1
      };
    }
  });
});

console.log(Object.values(resultMap));

Here I convert the original array to string and then count the character into another array as a result.

const array = [
  ["a", "b"],
  ["c", "d"],
  ["b", "d"],
  ["c", "a", "b"],
  ["a", "b", "c", "d"]
]
let result = array.join().replace(/[ ]/g, '').split(',')
let count = {}
result.forEach(c => count[c] = (count[c] || 0) + 1)
console.log(count)

本文标签：

版权声明：本文标题：javascript - Faster way to find an occurrence of 2-Dimensional array of keywords with frequency value - Stack Overflow 内容由网友自发贡献，该文观点仅代表作者本人，转载请联系作者并注明出处：http://www.betaflare.com/web/1743942103a2565749.html，本站仅提供信息存储空间服务，不拥有所有权，不承担相关法律责任。如发现本站有涉嫌抄袭侵权/违法违规的内容，一经查实，本站将立刻删除。

发表评论

全部评论 0

暂无评论

编程频道|软件玩家 - 软件改变生活！

javascript - Faster way to find an occurrence of 2-Dimensional array of keywords with frequency value - Stack Overflow

5 Answers 5

更多相关文章

vue.js - Nuxt 3 - linting error when using typescript types - Stack Overflow

javascript - Multiple queries in a loop Parse Cloud Code - Stack Overflow

Fade into black jQuery or Javascript effect? Exists? - Stack Overflow

javascript - Break on &quot;innerHTML&quot; changes in Chrome - Stack Overflow

c# - How to create a date in JavascriptJQuery from day, month and year? - Stack Overflow

javascript - Click on label - Pie chart jQuery Flot - Stack Overflow

javascript - How do I scale this layout? - Stack Overflow

swift - Agora iOS SDK Upgrade Breaking Voice Call Feature (Delegate Methods Not Called) in XCode 16+ - Stack Overflow

c - OpenSSL tpm2 provider - support for password protected TPM private key - Stack Overflow

jquery - JavaScript: get cursor position in contenteditable div - Stack Overflow

Rails development not showing error trace - Stack Overflow

android - Compile MAUI .NET 9 project with external DLL - Stack Overflow

sorting of array manually in javascript - Stack Overflow

javascript - Why does ~-1 equal 0 and ~1 equal -2? - Stack Overflow

json - Should I go with if-else or match-case in the below scenario? - Stack Overflow

azure webapps - Is it possible to check scale up logs - Stack Overflow

javascript - Open a new HTML page in a JS function and then write some HTML on it - Stack Overflow

javascript - Angular material Snackbar configuration with custom panelClass configuration for error, success, warning messages -

javascript - How to scroll to a specific component in React JS - Stack Overflow

javascript - Chrome Network Error - Downloading PDF - Stack Overflow

发表评论

推荐文章

push() method not working properly in JavaScript - Stack Overflow

Can you call JavaScript function from PHP loop? - Stack Overflow

javascript - set readonly attribute to keep the input editable - Stack Overflow

php - Hidden checkbox input values are not sent :( - Stack Overflow

reactjs - Responsive CSS sprite animation background - Stack Overflow

热门文章

javascript - Regex: Email validation that allows only hyphens in the middle of the domain and top-level domain - Stack Overflow

javascript - How to fetch API and Display data in my html code? - Stack Overflow

node.js - How to set initial memory size in node 22? - Stack Overflow

javascript - How do I combine puppeteer plugins with puppeteer clusters? - Stack Overflow

javascript - html link hover not working after link visited? - Stack Overflow

jquery - Steam API Get SteamID using Javascript - Stack Overflow

javascript - Uncaught TypeError: Cannot read property &#39;call&#39; of undefined after webpack rebuild CommonsChunkPlug

Javascript to remove trailing &amp;nbsp; - Stack Overflow

javascript - Cannot use getActiveObject() in Fabric.js - Stack Overflow

javascript - Filter array of objects if object contains attribute with value present in another array - Stack Overflow

最新文章

win11玩游戏找不到d3dx9怎么办？多种dll问题解决方法分享

使用U盘安装Ubuntu（Linux系统）保姆教程

u启动linux安装教程,u启动制作linux安装系统教程

Lenovo 50-80安装系统教程

上网问题：dns_probe_finished_no_internet

javascript - Summernote add fontsize to toolbar - Stack Overflow

typescript - Mendix nested object detection in pluggable widget - Stack Overflow

javascript - Chrome Network Error - Downloading PDF - Stack Overflow

class - How do you use a function to create an Object with Javascript? - Stack Overflow

javascript - Add multiple numbers to Array - Stack Overflow

惠普OMEN 15-CE001TX 2EF91PA参数报价

苹果新款MacBook Pro 15英寸 i732GB1TBVega Pro 20参数报价

联想Y330A-PSE L参数报价

神舟战神Z7 D6 i7-12650H16GB512GBRTX4050旗舰版参数报价

神舟战神Z7 D6 i7-12650H16GB1TBRTX4050参数报价

javascript - Break on "innerHTML" changes in Chrome - Stack Overflow

javascript - Uncaught TypeError: Cannot read property 'call' of undefined after webpack rebuild CommonsChunkPlug

Javascript to remove trailing   - Stack Overflow