twitter-ebooks/script/process_anc_data.rb
2013-11-08 06:02:05 +11:00

19 lines
316 B
Ruby
Executable file

#!/usr/bin/env ruby
# encoding: utf-8
require 'json'
freqmap = {}
data = File.read("data/ANC-all-count.txt")
data = data.unpack("C*").pack("U*")
data.lines.each do |l|
vals = l.split("\t")
freqmap[vals[0]] = vals[-1].to_i
end
File.open("data/wordfreq.json", 'w') do |f|
f.write(JSON.dump(freqmap))
end