You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

23 lines
473 B

-- Aggregate the output from ngrams.lua.
--
-- Step 1: get the data from all shards.
-- `counts` is deliberately a global: it is created empty here and then
-- "/tmp/lua-output" is executed as a Lua chunk by dofile. Presumably that file
-- consists of statements that fill in `counts` (ngram -> count) -- verify
-- against whatever writes the file. Any error raised while loading or running
-- the file propagates and aborts this script.
-- NOTE(review): dofile runs whatever code is in that file, and the path lives
-- in /tmp; confirm that only trusted jobs can write to it.
counts = {}
dofile("/tmp/lua-output")
-- Flatten the `counts` map into a sequence of {count, ngram} pairs.
-- A map keyed by ngram cannot be ordered directly, whereas a sequence can be
-- handed to table.sort. The count is stored first (index 1), the ngram second
-- (index 2).
countArray = {}
for key, total in pairs(counts) do
  countArray[#countArray + 1] = { total, key }
end
-- Ordering predicate for table.sort over {count, ngram} pairs.
--
-- Parameters:
--   a, b  tables whose index 1 holds the count and index 2 holds the ngram.
-- Returns:
--   true when `a` must be placed before `b`, false otherwise.
--
-- Primary order is by count, highest first. When two counts are equal the
-- pairs are ordered by the textual form of the ngram, ascending. Without this
-- tie-break the relative order of equal counts would depend on the traversal
-- order of pairs() and on table.sort (which is not stable), so the output
-- could differ from run to run for identical input.
function compare(a, b)
  if a[1] ~= b[1] then
    return a[1] > b[1]
  end
  -- tostring keeps the comparison valid even if the keys are not all strings.
  return tostring(a[2]) < tostring(b[2])
end
-- Order the pairs in place, using `compare` as the ordering predicate.
table.sort(countArray, compare)
-- Emit one line per pair to the default output: count, a tab, the ngram, and
-- a newline.
for idx = 1, #countArray do
  local entry = countArray[idx]
  io.write(entry[1], "\t", entry[2], "\n")
end