# main.py
import datetime
import sys
import time
from pprint import pprint

import psycopg2.extras

import database
import model
import view
  9. if __name__ == '__main__':
  10. row = -1
  11. if len(sys.argv) > 1:
  12. try:
  13. row = int(sys.argv[1])
  14. except ValueError:
  15. sys.exit(1)
  16. broadcast = True
  17. if len(sys.argv) > 2:
  18. broadcast = False
  19. start = time.time()
  20. db = database.db
  21. race_days_global = model.scrape_main_page(row)
  22. interim = time.time()
  23. # print('interim 1 {}'.format(interim - start))
  24. # pprint(race_days_global)
  25. race_days = []
  26. raw_data_dict = {}
  27. for race_day in race_days_global:
  28. raw_data = model.get_raw_scratchings(race_day)
  29. race_day_details = model.process_raw_data(raw_data, race_day)
  30. race_days.append(race_day_details)
  31. raw_data_dict[race_day.name] = raw_data
  32. interim = time.time()
  33. # print('interim 2 {}'.format(interim - start))
  34. # pprint(race_days)
  35. for race_day in race_days:
  36. if not raw_data_dict or not race_day:
  37. # raw_data_dict may be empty when there is no data available (yet)
  38. continue
  39. raw_data = raw_data_dict[race_day.name]
  40. scratchings = model.get_scratching_details(raw_data, race_day)
  41. if not scratchings:
  42. # model.get_scratchings_details may return empty
  43. continue
  44. # retrieve previous stored scratching for this venue / day
  45. query = "SELECT * FROM horses WHERE venue = %s AND race_date = %s;"
  46. cur1 = db.cursor(cursor_factory=psycopg2.extras.NamedTupleCursor)
  47. cur1.execute(query, (race_day.name, race_day.date))
  48. db_data = cur1.fetchall()
  49. # print(' 54. len(db_data): {}'.format(len(db_data)))
  50. # print(' 55. type(db_data): {}'.format(type(db_data)))
  51. # pprint(db_data)
  52. cur1.close()
  53. # compare retrieved scratchings with new data
  54. for scratching in scratchings:
  55. found_in_database = False
  56. if db_data is None:
  57. print(' 62. Caught db_data is None')
  58. found_in_database = False
  59. else:
  60. for row in db_data:
  61. # print('row: ', end = '')
  62. # print(type(row))
  63. # print(row)
  64. # if type(row) == 'datetime.time':
  65. # continue
  66. try:
  67. # if not hasattr(db_data, 'name'):
  68. # continue
  69. date_in_db_row_formatted = row.race_date.strftime('%Y-%m-%d')
  70. if (
  71. scratching.date == date_in_db_row_formatted and
  72. scratching.venue == row.venue and
  73. int(scratching.race) == int(row.race) and
  74. scratching.horse == row.horse
  75. ):
  76. message_string = 'Horse found: date = {}, venue = {}, race = {}, horse = {}'
  77. message = message_string.format(scratching.date,
  78. scratching.venue,
  79. scratching.race,
  80. scratching.horse)
  81. # print(message)
  82. # print(row)
  83. found_in_database = True
  84. except AttributeError as ae:
  85. print(ae)
  86. print(' 89. row: ', end='')
  87. print(row)
  88. pprint(db_data)
  89. continue
  90. if not found_in_database:
  91. # report new scratching
  92. date_object = datetime.datetime.strptime(scratching.date, "%Y-%m-%d").date()
  93. day_abbr = date_object.strftime('%a')
  94. query = """
  95. SELECT start_time, utctime, torn FROM race_program
  96. WHERE race_date = %s AND
  97. venue = %s AND
  98. race = %s;
  99. """
  100. cur2 = db.cursor(cursor_factory=psycopg2.extras.NamedTupleCursor)
  101. cur2.execute(query, (scratching.date, scratching.venue, scratching.race))
  102. db_data = cur2.fetchone()
  103. cur2.close()
  104. if db_data is None or len(db_data) == 0:
  105. print('106. cursor.execute(query, (scratching.date, scratching.venue, scratching.race))')
  106. print('107. cursor.execute({}, ({}, {}, {}))'.format(
  107. query, scratching.date, scratching.venue, scratching.race
  108. ))
  109. print('110. No race found')
  110. continue
  111. flag = ''
  112. if db_data.torn:
  113. flag = 'FLAGGED!! '
  114. message_string = '{}venue = {} {} {}-{} | race = {} starts at {} | {} UTC | horse = {}'
  115. message = message_string.format(flag,
  116. day_abbr,
  117. scratching.date,
  118. scratching.state,
  119. scratching.venue,
  120. scratching.race,
  121. db_data.start_time.strftime('%H:%M'),
  122. db_data.utctime.strftime('%H:%M'),
  123. scratching.horse)
  124. print(message)
  125. if broadcast:
  126. view.broadcast(message)
  127. # store new scratching
  128. query = """INSERT INTO horses(venue, race_date, race, horse)
  129. VALUES(%s, %s, %s, %s)
  130. ON CONFLICT(venue, race_date, race, horse) DO NOTHING;"""
  131. cur3 = db.cursor(cursor_factory=psycopg2.extras.NamedTupleCursor)
  132. cur3.execute(query, (scratching.venue, scratching.date,
  133. scratching.race, scratching.horse))
  134. cur3.close()
  135. print('Stored: {}'.format(scratching))
  136. time.sleep(0.5)
  137. db.commit()
  138. db.close()
  139. interim = time.time()
  140. # print('interim 3 {}'.format(interim - start))