data_processing.py 4.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121
  1. import json
  2. import pandas as pd
  3. import time
  4. import queue
  5. import threading
  6. # Initialize the DataFrame
  7. df_trades = pd.DataFrame(columns=['price', 'qty', 'timestamp'])
  8. df_order_book = pd.DataFrame(columns=['bid_price', 'bid_qty', 'ask_price', 'ask_qty'])
  9. previous_order_book = None
  10. fill_probabilities = {}
  11. order_disappearances = {}
  12. order_executions = {}
  13. last_trade = {'price': None, 'qty': None, 'side': None}
  14. messages = queue.Queue() # 创建一个线程安全队列
  15. stop_event = threading.Event()
  16. def on_message_trade(_ws, message):
  17. global df_trades, order_executions, last_trade
  18. json_message = json.loads(message)
  19. trade = {
  20. 'price': float(json_message['p']),
  21. 'qty': float(json_message['q']),
  22. 'timestamp': pd.to_datetime(json_message['T'], unit='ms'),
  23. 'side': 'buy' if json_message['m'] else 'sell' # 'm' indicates是否买方是做市商
  24. }
  25. trade_df = pd.DataFrame([trade])
  26. if not trade_df.empty and not trade_df.isna().all().all():
  27. df_trades = pd.concat([df_trades, trade_df], ignore_index=True)
  28. # 记录每个价格的实际成交总量
  29. price = trade['price']
  30. last_trade = {'price': price, 'qty': trade['qty'], 'side': trade['side']}
  31. if price not in order_executions:
  32. order_executions[price] = 0
  33. order_executions[price] += trade['qty']
  34. calculate_fill_probabilities()
  35. def on_message_depth(_ws, message):
  36. global df_order_book, order_disappearances, previous_order_book
  37. json_message = json.loads(message)
  38. bids = json_message['bids'][:10] # Top 10 bids
  39. asks = json_message['asks'][:10] # Top 10 asks
  40. order_book = {
  41. 'bid_price': [float(bid[0]) for bid in bids],
  42. 'bid_qty': [float(bid[1]) for bid in bids],
  43. 'ask_price': [float(ask[0]) for ask in asks],
  44. 'ask_qty': [float(ask[1]) for ask in asks]
  45. }
  46. df_order_book = pd.DataFrame([order_book])
  47. if previous_order_book is not None:
  48. # 计算订单消失量
  49. for level in range(10):
  50. bid_price = df_order_book['bid_price'].iloc[0][level]
  51. ask_price = df_order_book['ask_price'].iloc[0][level]
  52. bid_qty = df_order_book['bid_qty'].iloc[0][level]
  53. ask_qty = df_order_book['ask_qty'].iloc[0][level]
  54. prev_bid_qty = previous_order_book['bid_qty'].iloc[0][level]
  55. prev_ask_qty = previous_order_book['ask_qty'].iloc[0][level]
  56. # 计算bid订单消失量
  57. if bid_price not in order_disappearances:
  58. order_disappearances[bid_price] = 0
  59. if prev_bid_qty > bid_qty:
  60. order_disappearances[bid_price] += (prev_bid_qty - bid_qty)
  61. # 计算ask订单消失量
  62. if ask_price not in order_disappearances:
  63. order_disappearances[ask_price] = 0
  64. if prev_ask_qty > ask_qty:
  65. order_disappearances[ask_price] += (prev_ask_qty - ask_qty)
  66. previous_order_book = df_order_book
  67. calculate_fill_probabilities()
  68. # 计算成交概率
  69. def calculate_fill_probabilities():
  70. global order_executions, order_disappearances, fill_probabilities
  71. fill_probabilities = {}
  72. for price in order_disappearances:
  73. if price in order_executions:
  74. disappearances = order_disappearances[price]
  75. executions = order_executions[price]
  76. # 确保成交概率不大于1
  77. fill_probabilities[price] = min(executions / disappearances, 1) if disappearances > 0 else 0
  78. else:
  79. fill_probabilities[price] = 0
  80. # 定期记录和保存成交概率
  81. def log_and_save_fill_probabilities():
  82. global df_order_book, fill_probabilities
  83. while not stop_event.is_set():
  84. if fill_probabilities and not df_order_book.empty:
  85. asks = [[price, fill_probabilities[price]] for price in df_order_book['ask_price'].iloc[0] if
  86. price in fill_probabilities]
  87. bids = [[price, fill_probabilities[price]] for price in df_order_book['bid_price'].iloc[0] if
  88. price in fill_probabilities]
  89. last_price = last_trade['price']
  90. last_qty = last_trade['qty']
  91. side = last_trade['side']
  92. data = {
  93. "asks": asks,
  94. "bids": bids,
  95. "last_price": last_price,
  96. "last_qty": last_qty,
  97. "side": side,
  98. "time": int(time.time() * 1000)
  99. }
  100. messages.put(data)
  101. # logger.info("Market Snapshot:\n%s", json.dumps(data))
  102. stop_event.wait(0.1)