Skip to content

Instantly share code, notes, and snippets.

@ekiro
Created December 28, 2014 19:17
Show Gist options
  • Save ekiro/80c7e2539f7023a6a08d to your computer and use it in GitHub Desktop.
Save ekiro/80c7e2539f7023a6a08d to your computer and use it in GitHub Desktop.
#!/usr/bin/env python
# -*- coding: utf-8 -*-
# NOTE: the monkey patch is applied before the remaining imports on purpose.
# Per gevent's documentation, patch_all() swaps blocking standard-library
# pieces for cooperative ones and should run as early as possible, so that
# modules imported afterwards (here: requests) pick up the patched versions.
# Do not reorder these lines.
from gevent import monkey
monkey.patch_all()
import re
import time
import requests
from gevent.pool import Pool
# Module-level HTTP session; get_info() issues all of its requests through it.
s = requests.Session()
def get_info():
    """Download the A4 timetable page and every course page it references.

    The timetable page is fetched first; every ``id_kursu=<digits>`` match
    found in its text is turned into a ``pokaz_kurs.php`` URL, and those URLs
    are then requested through a gevent pool of 25 greenlets using the shared
    module-level session ``s``.

    Returns:
        list: the results of ``s.get`` for each course URL, as returned by
        ``Pool.map``. Empty when the page contains no ``id_kursu`` matches.
    """
    res = s.get('http://77.252.189.162/index.php?co=rozklady&submenu=tabliczka&'
                'nr_linii=A4&nr_przyst=1&id_trasy=13077')
    # Plain raw string instead of the Python 2-only ``ur`` prefix: the pattern
    # is pure ASCII, so it matches identically on Python 2, and it no longer
    # makes the module a SyntaxError on Python 3.
    ids = re.findall(r'id_kursu=(\d+)', res.text)
    base_url = 'http://77.252.189.162/rozklad/pokaz_kurs.php?id_kursu=%s'
    urls = [base_url % id_ for id_ in ids]
    # Pool size caps the number of requests in flight at once.
    p = Pool(25)
    ret = p.map(s.get, urls)
    return ret
if __name__ == '__main__':
    # Script entry point: run one full fetch and report how many responses
    # came back and how long the whole run took (wall-clock seconds).
    start = time.time()
    data = get_info()
    # A single pre-formatted string prints "<count> <seconds>" exactly as the
    # old ``print a, b`` statement did on Python 2, and is also valid as a
    # call to the Python 3 print function.
    print('%d %s' % (len(data), time.time() - start))
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment