jsonify: Support tweets.csv

Allow official archive tweets.csv as input to create Ebooks::Archive compatible JSON archive
2014-05-27 19:14:19 -04:00 · 2014-05-27 19:14:19 -04:00 · 74fd9c1e2e
commit 74fd9c1e2e
parent db453600be
1 changed files with 17 additions and 9 deletions
--- a/bin/ebooks
+++ b/bin/ebooks
@ -2,6 +2,7 @@
 # encoding: utf-8

 require 'twitter_ebooks'
+require 'csv'

 $debug = true

@ -154,16 +155,23 @@ STR

      tweets = []
      id = nil
-      File.read(path).split("\n").each do |l|
-        if l.start_with?('# ')
-          id = l.split('# ')[-1]
-        else
-          tweet = { text: l }
-          if id
-            tweet[:id] = id
-            id = nil
+      if path.split('.')[-1] == "csv" #from twitter archive
+        csv_archive = CSV.read(path, :headers=>:first_row)
+        tweets = csv_archive.map do |tweet|
+          { text: tweet['text'], id: tweet['tweet_id'] }
+        end
+      else
+        File.read(path).split("\n").each do |l|
+          if l.start_with?('# ')
+            id = l.split('# ')[-1]
+          else
+            tweet = { text: l }
+            if id
+              tweet[:id] = id
+              id = nil
+            end
+            tweets << tweet
          end
-          tweets << tweet
        end
      end