You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
23 lines
473 B
23 lines
473 B
-- Aggregate the output from ngrams.lua.

-- Get the data from all shards.
-- `counts` is intentionally a global: a chunk run through dofile cannot see
-- this file's locals, so a global table is the only thing it could update.
-- NOTE(review): presumably /tmp/lua-output holds Lua statements that fill in
-- `counts` (ngram -> count) — confirm against what ngrams.lua emits.
counts = {}
dofile("/tmp/lua-output")

-- Put the data into a sortable "array": one {count, ngram} pair per entry,
-- because a table keyed by ngram cannot be passed to table.sort directly.
countArray = {}
for ngram, count in pairs(counts) do
  table.insert(countArray, {count, ngram})
end

-- Sort the data.

-- Ordering predicate for table.sort over {count, ngram} pairs.
--   a, b: pairs where [1] is the count and [2] is the ngram.
-- Returns true when `a` must come before `b`: higher counts first.
-- Equal counts are ordered by the ngram's text so that the result does not
-- depend on pairs() iteration order (table.sort is not stable).
function compare(a, b)
  if a[1] ~= b[1] then
    return a[1] > b[1]
  end
  -- tostring keeps the comparison well-defined even if keys of mixed types
  -- end up in the table.
  return tostring(a[2]) < tostring(b[2])
end

-- Order the {count, ngram} pairs in place using the compare predicate.
table.sort(countArray, compare)

-- Write the result: one line per entry in sorted order, formatted as
-- count, a tab, the ngram, and a newline, to the default output file.
for _, countPair in ipairs(countArray) do
  io.write(countPair[1], "\t", countPair[2], "\n")
end