aboutsummaryrefslogtreecommitdiffhomepage
path: root/tools/lua/ngrams_aggregate.lua
blob: f8c93381495badfa80079858cf361afaf53650ae (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
-- Aggregate the output from ngrams.lua.

-- Collect the data from all shards: start with an empty global tally table,
-- then run the shard output file as a Lua chunk.
-- NOTE(review): presumably the file consists of statements that populate
-- `counts` -- confirm against ngrams.lua. The file lives in /tmp and is
-- executed as code, so make sure only trusted jobs can write to it.
counts = {}
local shardOutputPath = "/tmp/lua-output"
dofile(shardOutputPath)

-- Flatten the ngram -> count map into a list of {count, ngram} pairs so that
-- it can be handed to table.sort.
countArray = {}
for key, total in pairs(counts) do
  countArray[#countArray + 1] = {total, key}
end

-- Sort the data.
-- Ordering predicate for table.sort over {count, ngram} pairs.
--   a, b: two-element tables where [1] is the count and [2] is the ngram.
--   returns: true when `a` must be placed before `b`.
-- Pairs with a larger count come first. Pairs with equal counts are ordered
-- by the textual form of the ngram; without this tie-breaker their relative
-- order would depend on pairs() iteration order and on table.sort (which is
-- not stable), so the output could differ from run to run.
function compare(a, b)
  if a[1] ~= b[1] then
    return a[1] > b[1]
  end
  -- tostring() keeps the comparison valid even if keys are not all strings.
  return tostring(a[2]) < tostring(b[2])
end
-- Order the pairs in place using the compare predicate.
table.sort(countArray, compare)

-- Write the result: one "<count><TAB><ngram>" line per pair, in sorted order.
for idx = 1, #countArray do
  local entry = countArray[idx]
  io.write(entry[1], "\t", entry[2], "\n")
end