DBManager.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368
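'''
Historical data is currently fetched over HTTP.
Reserved for later: if data retrieval is switched to direct database access, this file
will be responsible for the database connection, SQL execution, and data retrieval.
'''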
  5. __author__ = 'lmstack'
  6. import time
  7. import datetime
  8. import time
  9. import pandas as pd
  10. import numpy as np
  11. import json
  12. import requests
  13. import pymysql
  14. import pdb
  15. class DBManager():
  16. def __init__(self, host='', port='', auth='', db='', username='', password=''):
  17. self.host = host
  18. self.port = port
  19. self.auth = auth
  20. self.db = db
  21. self.username = username
  22. self.password = password
  23. pass
  24. def __enter__(self):
  25. self.connect()
  26. return self
  27. def __exit__(self):
  28. self.close()
  29. def connect(self):
  30. conn_success_flag = 0
  31. while not conn_success_flag:
  32. try:
  33. self.conn = pymysql.connect(host=self.host, port=self.port, user=self.user, password=self.password, database=self.db)
  34. except Exception as e:
  35. conn_success_flag = 0
  36. print("数据库连接失败 :{}".format(e))
  37. time.sleep(5)
  38. else:
  39. conn_success_flag = 1
  40. self.cursor = self.conn.cursor()
  41. def close(self):
  42. try:
  43. self.conn.close()
  44. except Exception as e:
  45. print(e)
  46. else:
  47. print('数据库已断开连接')
  48. def add(table, keyvalue):
  49. fields_str = ''
  50. values_str = ''
  51. for k,v in keyvalue.items():
  52. fields_str += k+' '
  53. sql = 'insert into table {} ({}) values ({})'.format(table, fields_str, values_str)
  54. # 以下各个函数实现 通过http方式获取数据
  55. @staticmethod
  56. def _get_var_name(cellnum,Tempnum,Othernum):
  57. temp = []
  58. for i in range(cellnum):
  59. temp.append('单体电压'+str(i+1))
  60. for i in range(Tempnum):
  61. temp.append('单体温度'+str(i+1))
  62. for i in range(Othernum):
  63. temp.append('其他温度'+str(i+1))
  64. return temp
  65. @staticmethod
  66. def _download_json_data(url):
  67. '''
  68. 返回json数据的生成器,一次一行
  69. '''
  70. i = 0
  71. while 1:
  72. try:
  73. r = requests.get(url, stream=True, timeout=100, headers={'Connection':'close'})
  74. break
  75. except requests.exceptions.RequestException as e:
  76. if (i == 0):
  77. print()
  78. print('\r' + 'Server Error, retry {}......'.format(str(i)), end=" ")
  79. time.sleep(5)
  80. i+=1
  81. # print(r.content)
  82. # pdb.set_trace()
  83. for line in r.iter_lines():
  84. if line:
  85. yield json.loads(line)
  86. @staticmethod
  87. def _convert_to_dataframe_bms(data, mode=0):
  88. CellU = []
  89. CellT = []
  90. OtherT = []
  91. CellU_Num = 0
  92. CellT_Num = 0
  93. OtherT_Num = 0
  94. CellU_Num = len(data['ffBatteryStatus']['cellVoltageList'])
  95. CellT_Num = len(data['ffBatteryStatus']['cellTempList'])
  96. try:
  97. OtherT_Num = len(data['ffBatteryStatus']['otherTempList'])
  98. except:
  99. OtherT_Num = 0
  100. for i in range(CellU_Num):
  101. CellU.append(data['ffBatteryStatus']['cellVoltageList'][i]*1000)
  102. for i in range(CellT_Num):
  103. CellU.append(data['ffBatteryStatus']['cellTempList'][i])
  104. for i in range(OtherT_Num):
  105. CellU.append(data['ffBatteryStatus']['otherTempList'][i])
  106. if mode == 0:
  107. data_len = 15
  108. data_block = np.array([data['info']['obdTime'],data['ffBatteryStatus']['rssi'],data['ffBatteryStatus']['errorLevel'],data['ffBatteryStatus']['errorCode']
  109. ,data['ffBatteryStatus']['current'],data['ffBatteryStatus']['voltageInner'],data['ffBatteryStatus']['voltageOutter'],
  110. data['ffBatteryStatus']['totalOutputState'],data['ffBatteryStatus']['lockedState'],
  111. data['ffBatteryStatus']['chargeState'],data['ffBatteryStatus']['heatState'],data['ffBatteryStatus']['cellVoltageDiff']
  112. ,data['ffBatteryStatus']['soc'],data['ffBatteryStatus']['soh'],data['ffBatteryStatus']['cellVolBalance']]).reshape(1,data_len)
  113. elif mode == 1:
  114. data_len = 11
  115. data_block = np.array([data['info']['obdTime'],data['ffBatteryStatus']['rssi']
  116. ,data['ffBatteryStatus'].get('errorLevel'),data['ffBatteryStatus'].get('errorCode'),data['ffBatteryStatus']['switchState']
  117. ,data['ffBatteryStatus']['current'],data['ffBatteryStatus']['voltageInner'],data['ffBatteryStatus']['chargeState'],
  118. data['ffBatteryStatus']['cellVoltageDiff'],data['ffBatteryStatus']['soc'],data['ffBatteryStatus']['soh']]).reshape(1,data_len)
  119. data_block = np.append(data_block,CellU)
  120. data_block = np.append(data_block,CellT)
  121. data_block = np.append(data_block,OtherT)
  122. data_block = data_block.reshape(1,len(data_block))
  123. return data_block,CellU_Num,CellT_Num,OtherT_Num
  124. @staticmethod
  125. def _convert_to_dataframe_gps(data, mode=0):
  126. if mode == 0:
  127. if data['info']['subType'] == 1:
  128. data_block = np.array([data['info']['obdTime'],data['ffGps']['locationType'], data['ffGps']['satellites'],
  129. data['ffGps']['latitude'],data['ffGps']['longitude'],data['ffGps']['speed'],
  130. data['ffGps']['altitude'], data['ffGps']['direction']]).reshape(1,8)
  131. df = pd.DataFrame(
  132. columns=['时间戳','定位类型', '卫星数','纬度','经度','速度[km/h]','海拔','航向'],data=data_block)
  133. elif data['info']['subType'] == 2:
  134. df = pd.DataFrame(
  135. columns=['时间戳','定位类型', '卫星数','纬度','经度','速度[km/h]','海拔','航向'])
  136. if mode == 1:
  137. data_block = np.array([data['info']['obdTime'],data['ffGps']['locationType'],data['ffGps']['latitude'],data['ffGps']['longitude']
  138. ,data['ffGps']['speed'], data['ffGps']['isValid']]).reshape(1,6)
  139. df = pd.DataFrame(
  140. columns=['时间戳','定位类型', '纬度','经度','速度[km/h]','有效位'],data=data_block)
  141. return df
  142. @staticmethod
  143. def _convert_to_dataframe_system(data, mode=0):
  144. if mode == 0:
  145. data_block = np.array([data['info']['obdTime'],data['ffSystemInfo']['heatTargetTemp'], data['ffSystemInfo']['heatTimeout'],
  146. time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(int(data['ffSystemInfo']['rentalStartTime'])/1000)),
  147. data['ffSystemInfo']['rentalPeriodDays'],data['ffSystemInfo']['bmsInterval'],
  148. data['ffSystemInfo']['gpsInterval']]).reshape(1,7)
  149. df = pd.DataFrame(
  150. columns=['时间戳','加热目标温度', '加热超时','租赁开始时间','租赁天数','bms上传周期','gps上传周期'],data=data_block)
  151. if mode == 1:
  152. df = pd.DataFrame()
  153. return df
  154. @staticmethod
  155. def _convert_to_dataframe_accum(data, mode=0):
  156. if mode == 0:
  157. data_block = np.array([data['info']['obdTime'],data['ffBatteryAccum']['SOH_AlgUnexTime'], data['ffBatteryAccum']['CHG_AHaccum'],
  158. data['ffBatteryAccum']['CHG_PHaccum'], data['ffBatteryAccum']['DSG_AHaccum'],
  159. data['ffBatteryAccum']['DSG_PHaccum'],data['ffBatteryAccum']['OverTemp_CHG_AHaccum'],
  160. data['ffBatteryAccum']['OverTemp_CHG_PHaccum']]).reshape(1,8)
  161. df = pd.DataFrame(
  162. columns=['时间戳','SOH未标定时间', '累计充电电量','累计充电能量','累计放电电量','累计放电能量',
  163. '累计高温充电电量', '累计高温充电能量'],data=data_block)
  164. if mode == 1:
  165. data_block = np.array([data['info']['obdTime'], data['ffBatteryAccum']['CHG_AHaccum'],
  166. data['ffBatteryAccum']['CHG_PHaccum'], data['ffBatteryAccum']['DSG_AHaccum'],
  167. data['ffBatteryAccum']['DSG_PHaccum'],data['ffBatteryAccum']['totalMileage']]).reshape(1,6)
  168. df = pd.DataFrame(
  169. columns=['时间戳','累计充电电量','累计充电能量','累计放电电量','累计放电能量', '累积里程'],data=data_block)
  170. return df
  171. @staticmethod
  172. def _get_data(urls,type_name,mode=0):
  173. if type_name == 'bms':
  174. if mode == 0:
  175. name_const = ['时间戳','GSM信号','故障等级','故障代码','总电流[A]','总电压[V]', '外电压', '总输出状态', '上锁状态', '充电状态','加热状态',
  176. '单体压差', 'SOC[%]','SOH[%]','单体均衡状态']
  177. elif mode == 1:
  178. name_const = ['时间戳','GSM信号','故障等级', '故障代码','开关状态', '总电流[A]','总电压[V]','充电状态', '单体压差', 'SOC[%]','SOH[%]']
  179. i=0
  180. CellUNum = 0
  181. CellTNum = 0
  182. OtherTNumm = 0
  183. st = time.time()
  184. for line in DBManager._download_json_data(urls):
  185. et = time.time()
  186. if i==0:
  187. data_blocks,CellUNum,CellTNum,OtherTNumm = DBManager._convert_to_dataframe_bms(line, mode)
  188. i+=1
  189. continue
  190. try:
  191. data_block,CellUNum,CellTNum,OtherTNumm = DBManager._convert_to_dataframe_bms(line, mode)
  192. except:
  193. continue
  194. try:
  195. data_blocks = np.concatenate((data_blocks,data_block),axis=0)
  196. except Exception as e:
  197. if 'all the input array dimensions for the concatenation axis must match exactly' in str(e) or \
  198. 'all the input array dimensions except for the concatenation axis must match exactly' in str(e):
  199. pass
  200. else:
  201. pdb.set_trace()
  202. raise e
  203. # print('\r'+str(i),end=" ")
  204. # print(data_block)
  205. # print(urls)
  206. # print(time.time()-et)
  207. i+=1
  208. name_var = DBManager._get_var_name(CellUNum,CellTNum,OtherTNumm)
  209. name_const.extend(name_var)
  210. columns_name = name_const
  211. if i==0:
  212. data_blocks = []
  213. df_all = pd.DataFrame(columns=columns_name,data=data_blocks)
  214. if not df_all.empty:
  215. df_all.loc[:,'时间戳'] = df_all.loc[:,'时间戳'].apply(lambda x:time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(int(x)/1000)))
  216. return df_all
  217. elif type_name =='gps':
  218. if mode == 0:
  219. df_all = pd.DataFrame(columns=['时间戳','定位类型', '卫星数','纬度','经度','速度[km/h]','海拔','航向'])
  220. elif mode == 1:
  221. df_all = pd.DataFrame(columns=['时间戳','定位类型', '纬度','经度','速度[km/h]','有效位'])
  222. for line in DBManager._download_json_data(urls):
  223. df_add = DBManager._convert_to_dataframe_gps(line, mode)
  224. df_all = df_all.append(df_add,ignore_index=True)
  225. if not df_all.empty:
  226. df_all.loc[:,'时间戳'] = df_all.loc[:,'时间戳'].apply(lambda x:time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(int(x)/1000)))
  227. return df_all
  228. elif type_name =='system':
  229. if mode == 0:
  230. df_all = pd.DataFrame(columns=['时间戳','加热目标温度', '加热超时','租赁开始时间','租赁天数','bms上传周期','gps上传周期'])
  231. elif mode == 1:
  232. df_all = pd.DataFrame()
  233. for line in DBManager._download_json_data(urls):
  234. df_add = DBManager._convert_to_dataframe_system(line, mode)
  235. df_all = df_all.append(df_add,ignore_index=True)
  236. if not df_all.empty:
  237. df_all.loc[:,'时间戳'] = df_all.loc[:,'时间戳'].apply(lambda x:time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(int(x)/1000)))
  238. return df_all
  239. elif type_name =='accum':
  240. if mode == 0:
  241. df_all = pd.DataFrame(columns=['时间戳','SOH未标定时间', '累计充电电量','累计充电能量','累计放电电量','累计放电能量',
  242. '累计高温充电电量', '累计高温充电能量'])
  243. elif mode == 1:
  244. df_all = pd.DataFrame(columns=['时间戳','累计充电电量','累计充电能量','累计放电电量','累计放电能量', '累积里程'])
  245. for line in DBManager._download_json_data(urls):
  246. df_add = DBManager._convert_to_dataframe_accum(line, mode)
  247. df_all = df_all.append(df_add,ignore_index=True)
  248. if not df_all.empty:
  249. df_all.loc[:,'时间戳'] = df_all.loc[:,'时间戳'].apply(lambda x:time.strftime('%Y-%m-%d %H:%M:%S',time.localtime(int(x)/1000)))
  250. return df_all
  251. def get_data(self, url='http://172.16.126.13/store/load?dataType={}&limit=0&sn={}', sn='', start_time='', end_time='',
  252. data_groups=['bms', 'gps']):
  253. '''
  254. 获取指定 sn 和起止日期的bms和gps数据.
  255. 添加了重试机制。
  256. --------------输入参数------------
  257. url:数据获取url, 可采用默认值
  258. sn: str, 电池sn号
  259. start_time: str, 开始时间
  260. end_time: str, 结束时间
  261. data_groups: 选择需要获取的数据组,可填入多个字符串(默认只获取bms和gps数据)
  262. bms: bms数据
  263. gps:gps数据
  264. system:system数据
  265. accum:accum数据
  266. --------------输出参数------------
  267. df_data: {'bms':dataframe, 'gps':dataframe, 'system':dataframe, ;accum':dataframe}
  268. '''
  269. if len(set(data_groups) - (set(data_groups) and set(['bms', 'gps', 'system', 'accum']))) > 0:
  270. raise Exception("data_groups 参数错误")
  271. # mode: 0:正常取数; 1:7255 取数
  272. if sn[0:2] == 'UD' or sn[0:2] == 'MG':
  273. mode = 1
  274. else:
  275. mode = 0
  276. bms_all_data = pd.DataFrame()
  277. gps_all_data = pd.DataFrame()
  278. system_all_data = pd.DataFrame()
  279. accum_all_data = pd.DataFrame()
  280. maxnum = (datetime.datetime.strptime(end_time, "%Y-%m-%d %H:%M:%S") - datetime.datetime.strptime(start_time, "%Y-%m-%d %H:%M:%S")).days +1
  281. print("### start to get data {} from {} to {}".format(sn, start_time, end_time))
  282. # 为避免chunkEncodingError错误,数据每天获取一次,然后将每天的数据合并,得到最终的数据
  283. for j in range(int(maxnum)):
  284. timefrom = datetime.datetime.strptime(start_time, "%Y-%m-%d %H:%M:%S")+ datetime.timedelta(days=j)
  285. timeto = datetime.datetime.strptime(start_time, "%Y-%m-%d %H:%M:%S")+ datetime.timedelta(days=j+1)
  286. #滴滴的数据sub=0
  287. if timefrom.strftime('%Y-%m-%d %H:%M:%S') >= end_time:
  288. break
  289. elif timeto.strftime('%Y-%m-%d %H:%M:%S') > end_time:
  290. timeto = datetime.datetime.strptime(end_time, '%Y-%m-%d %H:%M:%S')
  291. #print('{}_{}_----getting data----'.format(sn, timefrom))
  292. bms_data = pd.DataFrame()
  293. gps_data = pd.DataFrame()
  294. system_data = pd.DataFrame()
  295. accum_data = pd.DataFrame()
  296. while True:
  297. try:
  298. print('\r' + "# get data from {} to {}.........".format(str(timefrom), str(timeto)), end=" ")
  299. for data_group in data_groups:
  300. if data_group == 'bms':
  301. file_url = url.format(12, sn) + "&from="+timefrom.strftime('%Y-%m-%d %H:%M:%S')+"&to="+timeto.strftime('%Y-%m-%d %H:%M:%S')
  302. bms_data = DBManager._get_data(file_url,'bms',mode)
  303. if data_group == 'gps':
  304. file_url = url.format(16, sn) + "&from="+timefrom.strftime('%Y-%m-%d %H:%M:%S')+"&to="+timeto.strftime('%Y-%m-%d %H:%M:%S')
  305. gps_data = DBManager._get_data(file_url,'gps',mode)
  306. if data_group == 'system':
  307. file_url = url.format(13, sn) + "&from="+timefrom.strftime('%Y-%m-%d %H:%M:%S')+"&to="+timeto.strftime('%Y-%m-%d %H:%M:%S')
  308. system_data = DBManager._get_data(file_url,'system',mode)
  309. if data_group == 'accum':
  310. file_url = url.format(23, sn) + "&from="+timefrom.strftime('%Y-%m-%d %H:%M:%S')+"&to="+timeto.strftime('%Y-%m-%d %H:%M:%S')
  311. accum_data = DBManager._get_data(file_url,'accum',mode)
  312. except Exception as e:
  313. if 'Connection broken' in str(e):
  314. continue
  315. else:
  316. raise Exception
  317. else:
  318. bms_all_data = pd.concat([bms_all_data, bms_data], ignore_index=True)
  319. gps_all_data = pd.concat([gps_all_data, gps_data], ignore_index=True)
  320. system_all_data = pd.concat([system_all_data, system_data], ignore_index=True)
  321. accum_all_data = pd.concat([accum_all_data, accum_data], ignore_index=True)
  322. break
  323. bms_all_data = bms_all_data.reset_index(drop=True)
  324. gps_all_data = gps_all_data.reset_index(drop=True)
  325. system_all_data = system_all_data.reset_index(drop=True)
  326. accum_all_data = accum_all_data.reset_index(drop=True)
  327. print('\nall data-getting done, bms_count is {}, gps_count is {}, system_count is {}, accum_count is {} \n'.format(
  328. str(len(bms_all_data)), str(len(gps_all_data)), str(len(system_all_data)), str(len(accum_all_data))))
  329. return {'bms':bms_all_data, 'gps':gps_all_data, 'system':system_all_data, 'accum':accum_all_data}