source.py 7.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200
  1. from class_xml import XML
  2. import config
  3. import datetime
  4. from itertools import chain
  5. # SOURCE CLASSES
  6. class Source:
  7. pass
  8. class SourceProvider:
  9. def dic_of_names(self):
  10. """Returns a dictionary mapping ids to name (for find.py)"""
  11. return []
  12. def dic_of_positions(self):
  13. """Returns a dictionary mapping ids to position (for geocoding.py)"""
  14. return []
  15. def sources_of_ids(self, ids):
  16. """Returns a generator of Source these ids"""
  17. return []
  18. ############## RATP ##############
  19. class Source_ratp(Source):
  20. def __init__(self, ident, status, message):
  21. self.source = 'ratp_trafic'
  22. self.id = ident
  23. self.status = status
  24. self.message = message
  25. def problem(self):
  26. return self.status != 'normal'
  27. class SourceProvider_ratp(SourceProvider):
  28. def __init__(self):
  29. self.names = None
  30. self.positions = None
  31. def dic_of_names(self):
  32. if not self.names:
  33. print('Téléchargement de la liste des lignes ratp...')
  34. xml = XML(url='http://www.ratp.fr/meteo/', lang='html')
  35. self.names = {tag['id']: tag['id'].replace('_', ' ') for tag in xml.data.select('.encadre_ligne')}
  36. return self.names
  37. def dic_of_positions(self):
  38. return {} # TODO API ratp
  39. def sources_of_ids(self, ids):
  40. for tag in XML(url="http://www.ratp.fr/meteo/", lang="html").data.select('div.encadre_ligne'):
  41. if tag['id'] in ids:
  42. yield Source_ratp(tag['id'], tag.img['alt'],\
  43. tag['id'].replace('_', ' ') + ' : ' + tag.select('span.perturb_message')[0].string)
  44. ############## JCDECAUX_VLS ##############
  45. class Source_jcdecaux_vls(Source):
  46. def __init__(self, ident, nom, timestamp, status):
  47. self.source = 'jcdecaux_vls'
  48. self.id = ident
  49. self.status = status # TODO dans l'API pour 1 station il semble que c'est toujours OPEN :-(
  50. self.date = datetime.datetime.fromtimestamp(int(timestamp)/1000).strftime('à %Hh%M le %d/%m')
  51. if status != "OPEN":
  52. self.message = 'Station vélo ' + nom.lower() + ' ' + self.date + ' : fermée !'
  53. else:
  54. self.message = None
  55. def problem(self):
  56. return self.status != "OPEN"
  57. class Source_jcdecaux_vls_full(Source_jcdecaux_vls):
  58. def __init__(self, ident, nom, timestamp, places, status):
  59. super(Source_jcdecaux_vls_full, self).__init__(ident, nom, timestamp, status)
  60. self.id += "_full"
  61. self.places = int(places)
  62. if not self.message:
  63. self.message = 'Station vélo ' + nom.lower() + ' ' + self.date + ' : '
  64. if self.places == 0:
  65. self.message += 'plus de place !'
  66. elif self.places == 1:
  67. self.message += 'plus qu\'une place !'
  68. else:
  69. self.message += 'plus que ' + places + ' places disponibles !'
  70. def problem(self):
  71. return super(Source_jcdecaux_vls_full, self).problem() or self.places <= config.sources_params['jcdecaux_vls']['limit_full']
  72. class Source_jcdecaux_vls_empty(Source_jcdecaux_vls):
  73. def __init__(self, ident, nom, timestamp, bikes, status):
  74. super(Source_jcdecaux_vls_empty, self).__init__(ident, nom, timestamp, status)
  75. self.id += "_empty"
  76. self.bikes = int(bikes)
  77. if not self.message:
  78. self.message = 'Station vélo ' + nom.lower() + ' ' + self.date + ' : '
  79. if self.bikes == 0:
  80. self.message += 'plus de vélo !'
  81. elif self.bikes == 1:
  82. self.message += 'plus qu\'un vélo !'
  83. else:
  84. self.message += 'plus que ' + bikes + ' vélos !'
  85. def problem(self):
  86. return super(Source_jcdecaux_vls_empty, self).problem() or self.bikes <= config.sources_params['jcdecaux_vls']['limit_empty']
  87. class SourceProvider_jcdecaux_vls(SourceProvider):
  88. def __init__(self):
  89. self.names = {}
  90. self.positions = None
  91. def dic_of_names(self, contract=None):
  92. contract = contract or 'all'
  93. if contract not in self.names:
  94. print('Téléchargement de la liste des stations pour le contrat ' + contract + '...')
  95. if contract != 'all':
  96. xml = XML(url='https://api.jcdecaux.com/vls/v1/stations?contract=' + contract + '&apiKey=' + config.api_key['jcdecaux_vls'], lang='json')
  97. else:
  98. xml = XML(url='https://api.jcdecaux.com/vls/v1/stations?apiKey=' + config.api_key['jcdecaux_vls'], lang='json')
  99. self.names = {}
  100. for sta in xml.data.json.find_all("item", recursive=False):
  101. self.names[sta.contract_name.string.lower() + '_' + sta.number.string] =\
  102. sta.find('name').string + ' (' + sta.address.get_text() + ')'
  103. # we use find('name') because .name is the current tag name
  104. return self.names
  105. def dic_of_positions(self):
  106. if not self.positions:
  107. print('Téléchargement de la liste des stations...')
  108. xml = XML(url='https://api.jcdecaux.com/vls/v1/stations?apiKey=' + config.api_key['jcdecaux_vls'], lang='json')
  109. self.positions = {}
  110. for sta in xml.data.json.find_all("item", recursive=False):
  111. self.positions[sta.contract_name.string.lower() + '_' + sta.number.string + '_' + 'full'] =\
  112. (sta.lat.string, sta.lng.string)
  113. # we use find('name') because .name is the current tag name
  114. return self.positions
  115. def sources_of_ids(self, ids):
  116. ids_set = set(map(lambda s : s.rsplit('_', 1)[0], ids))
  117. for station in ids_set:
  118. (contract, number) = list(station.split('_'))
  119. xml = XML(url="https://api.jcdecaux.com/vls/v1/stations/" + number + "?contract=" + contract + "&apiKey="+config.api_key['jcdecaux_vls'], lang="json")
  120. tag = xml.data.json
  121. if contract + '_' + number + '_full' in ids:
  122. yield Source_jcdecaux_vls_full(contract + '_' + number, tag.find('name').string, tag.last_update.string, tag.available_bike_stands.string, tag.status.string)
  123. if contract + '_' + number + '_empty' in ids:
  124. yield Source_jcdecaux_vls_empty(contract + '_' + number, tag.find('name').string, tag.last_update.string, tag.available_bikes.string, tag.status.string)
  125. ############## TRANSILIEN ##############
  126. class Source_transilien(Source):
  127. def __init__(self, ident, message):
  128. self.source = 'transilien'
  129. self.id = ident
  130. self.message = message
  131. def problem(self):
  132. return self.message != 'Trafic normal'
  133. class SourceProvider_transilien(SourceProvider):
  134. def __init__(self):
  135. self.names = None
  136. self.positions = None
  137. def dic_of_names(self):
  138. if not self.names:
  139. print('Téléchargement de la liste des lignes transilien...')
  140. xml = XML(url='http://www.transilien.com/info-trafic/temps-reel', lang='html')
  141. self.names = {}
  142. for line in xml.data.select('div.b_info_trafic')[0].find_all('div', recursive=False):
  143. id = line.select('.picto-transport')[1].get_text()
  144. self.names[id] = id.replace('-', ' ')
  145. return self.names
  146. def dic_of_positions(self):
  147. return {} # TODO
  148. def sources_of_ids(self, ids):
  149. xml = XML(url="http://www.transilien.com/info-trafic/temps-reel", lang="html").data
  150. container = xml.select('div.b_info_trafic')[0]
  151. for line in container.find_all('div', recursive=False):
  152. id = line.select('.picto-transport')[1].get_text()
  153. if id in ids:
  154. message = ""
  155. for c in line.select_one('.title').children:
  156. if c.name: # a tag
  157. if 'picto-transport' not in c.attrs.get('class', ''):
  158. message += c.get_text()
  159. else: # a string
  160. message += c
  161. for det in line.select('.item-disruption'):
  162. message += det.get_text()
  163. message = " ".join(message.split()) # delete multiple spaces
  164. yield Source_transilien(id, message)