jsonify: Support tweets.csv

Allow the tweets.csv file from an official Twitter archive as input for creating an Ebooks::Archive-compatible JSON archive.
2014-05-27 19:14:19 -04:00 · 2014-05-27 19:14:19 -04:00 · 74fd9c1e2e
commit 74fd9c1e2e
parent db453600be
1 changed files with 17 additions and 9 deletions
--- a/bin/ebooks
+++ b/bin/ebooks
@ -2,6 +2,7 @@
 # encoding: utf-8
 require 'twitter_ebooks'
 require 'csv'
 $debug = true
@ -154,16 +155,23 @@ STR
      tweets = []
      id = nil
-      File.read(path).split("\n").each do |l|
+      if path.split('.')[-1] == "csv" #from twitter archive
-        if l.start_with?('# ')
+        csv_archive = CSV.read(path, :headers=>:first_row)
-          id = l.split('# ')[-1]
+        tweets = csv_archive.map do |tweet|
-        else
+          { text: tweet['text'], id: tweet['tweet_id'] }
-          tweet = { text: l }
+        end
-          if id
+      else
-            tweet[:id] = id
+        File.read(path).split("\n").each do |l|
-            id = nil
+          if l.start_with?('# ')
            id = l.split('# ')[-1]
          else
            tweet = { text: l }
            if id
              tweet[:id] = id
              id = nil
            end
            tweets << tweet
          end
          tweets << tweet
        end
      end