-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathscrapeSportsBookNCAAHalfLines.py
65 lines (53 loc) · 2.04 KB
/
scrapeSportsBookNCAAHalfLines.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
__author__ = 'tanyacashorali'
import urllib2
import time
import re
import random
import datetime
import os
import sqlite3
import pandas as pd
from urlparse import urlparse
from bs4 import BeautifulSoup as bs
from datetime import date, timedelta
db = sqlite3.connect('/home/ec2-user/sports/sports.db')
x=random.randint(1, 20)
time.sleep(x)
url = urllib2.urlopen('https://www.sportsbook.ag/sbk/sportsbook4/ncaa-basketball-betting/2nd-half-ncaa-basketball.sbk')
soup = bs(url.read(), ['fast', 'lxml'])
divs=soup.findAll('div', {'class':'col-sm-12 eventbox'})
awayTeams=[d.findAll('span', {'id':'awayTeamName'}) for d in divs]
homeTeams=[d.findAll('span', {'id':'homeTeamName'}) for d in divs]
awayTeams=[a[0].text for a in awayTeams]
homeTeams=[h[0].text for h in homeTeams]
market=[d.findAll('div', {'class':'market'}) for d in divs]
the_lines=[m[0].text for m in market]
the_spreads=[m[1].text for m in market]
lines = []
spreads = []
for i in range(0, len(the_lines)):
try:
lines.append(re.search('(\d+\\.?\d+)\\(', the_lines[i]).group(1))
spreads.append(re.search('([+-]\d+\\.?\d?)\\(', the_spreads[i]).group(1))
except:
next
#today = date.today()
#today = today.strftime("%m/%d/%Y")
today = str(datetime.datetime.now() - timedelta(hours=2))[0:10]
today = time.strftime("%m/%d/%Y", time.strptime(today, '%Y-%m-%d'))
date_time = str(datetime.datetime.now())
for i in range(0, len(lines)):
try:
with db:
db.execute('''INSERT INTO NCAASBHalfLines(away_team, home_team, line, spread, game_date, game_time) VALUES(?,?,?,?,?,?)''', (awayTeams[i], homeTeams[i], lines[i], spreads[i], today, date_time))
db.commit()
except sqlite3.IntegrityError:
print 'Record Exists'
for i in range(0, len(lines)):
try:
with db:
db.execute('''INSERT INTO NCAASBteamlookup(sb_team, espn_abbr) VALUES (?,?)''', (awayTeams[i], None))
db.execute('''INSERT INTO NCAASBteamlookup(sb_team, espn_abbr) VALUES (?,?)''', (homeTeams[i], None))
except:
print 'Record Exists'
db.close()