plot-num-msg-by-time.py 1.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748
  1. #!/usr/bin/env python3
  2. # -*- coding: UTF-8 -*-
  3. from wechat.parser import WeChatDBParser
  4. from datetime import timedelta, datetime
  5. import matplotlib.pyplot as plt
  6. import sys
  7. if __name__ == '__main__':
  8. if len(sys.argv) != 3:
  9. sys.exit("Usage: {0} <path to decrypted_database.db> <name>".format(sys.argv[0]))
  10. db_file = sys.argv[1]
  11. name = sys.argv[2]
  12. every_k_days = 2
  13. parser = WeChatDBParser(db_file)
  14. msgs = parser.msgs_by_chat[name]
  15. times = [x.createTime for x in msgs]
  16. start_time = times[0]
  17. diffs = [(x - start_time).days for x in times]
  18. max_day = diffs[-1]
  19. width = 20
  20. numbers = range((max_day / width + 1) * width + 1)[::width]
  21. labels = [(start_time + timedelta(x)).strftime("%m/%d") for x in numbers]
  22. plt.xticks(numbers, labels)
  23. plt.xlabel("Date")
  24. plt.ylabel("Number of msgs in k days")
  25. plt.hist(diffs, bins=max_day / every_k_days)
  26. plt.show()
  27. # statistics by hour
  28. # I'm in a different time zone in this period:
  29. #TZ_DELTA = {(datetime(2014, 7, 13), datetime(2014, 10, 1)): -15}
  30. #def real_hour(x):
  31. #for k, v in TZ_DELTA.items():
  32. #if x > k[0] and x < k[1]:
  33. #print x
  34. #return (x.hour + v + 24) % 24
  35. #return x.hour
  36. #hours = [real_hour(x) for x in times]
  37. #plt.ylabel("Number of msgs")
  38. #plt.xlabel("Hour in a day")
  39. #plt.hist(hours, bins=24)
  40. #plt.show()