first commit yay
This commit is contained in:
parent
7ecfb1e29a
commit
e6fc19ca0d
3 changed files with 50 additions and 0 deletions
2
.gitignore
vendored
Normal file
2
.gitignore
vendored
Normal file
|
@ -0,0 +1,2 @@
|
|||
*.pyc
|
||||
__pycache__
|
2
README.md
Normal file
2
README.md
Normal file
|
@ -0,0 +1,2 @@
|
|||
# NAIA Men's Volleyball Stats
|
||||
I played collegiate volleyball about 7-8 years ago. I am writing this program to make sure there are offline, archived copies of the men's volleyball stats for Cardinal Stritch University. It is released under the GPL in case anyone wants to modify it for their own team.
|
46
pull_box_score.py
Executable file
46
pull_box_score.py
Executable file
|
@ -0,0 +1,46 @@
|
|||
#!/usr/bin/env python
|
||||
|
||||
from bs4 import BeautifulSoup
|
||||
import requests
|
||||
|
||||
#### THE FIRST THREE YEARS (2010/2011/2012) ARE RETRIEVED DIFFERENTLY THAN 2013-2017
|
||||
|
||||
|
||||
|
||||
class Old_Stats:
    """Retrieve the mens volleyball statistics data from years 2010, 2011, 2012 for MAMVIC NAIA Cardinal Stritch.

    The class holds no constructor state.  ``base_urls`` records the
    ``sport_url`` and ``base_url`` attributes on the instance as a side
    effect; ``get_box_score_links`` relies on ``sport_url`` being set that way.
    """

    def years(self):
        """Return the list of seasons covered, 2010 through 2012 inclusive."""
        start_year = 2010
        end_year = 2012

        # +1 because range() excludes its upper bound.
        return list(range(start_year, end_year + 1))

    def base_urls(self):
        """Return one scheme-less team-stat page URL per season.

        Side effects: sets ``self.sport_url`` to the page/query suffix and
        leaves ``self.base_url`` pointing at the directory of the last season
        processed.
        """
        self.sport_url = '/teamstat.htm?path=mvball'
        base_urll = []
        # Iterate the seasons directly instead of rebuilding the year list on
        # every pass through an index loop.
        for year in self.years():
            self.base_url = 'static.stritchwolves.com/custompages/MVB/' + str(year)
            base_urll.append(self.base_url + self.sport_url)
        return base_urll

    def get_box_score_links(self):
        """Fetch every season's team-stat page and return the links found on it.

        Each page is downloaded over HTTP and parsed with the ``lxml`` parser.
        The ``href`` of every ``<a>`` tag is appended to that season's
        directory URL, so the result holds all anchors on the page (presumably
        the box scores -- verify against the live markup).

        Returns:
            A list of absolute ``http://`` URL strings, in page order, seasons
            in ascending order.

        Raises:
            Whatever ``requests.get`` raises on a network failure.
        """
        link_list = []

        # Build the URL list once; the original recomputed it for every
        # request and again for every single link.
        for page_url in self.base_urls():
            r = requests.get('http://' + page_url)
            soup = BeautifulSoup(r.text, 'lxml')

            # Directory of this season: the page URL minus the page/query part.
            season_root = 'http://' + page_url.replace(self.sport_url, '') + '/'

            for link in soup.find_all('a'):
                href = link.get('href')
                # Anchors without an href (e.g. <a name="...">) yield None,
                # which cannot be concatenated to a string.
                if href is None:
                    continue
                link_list.append(season_root + href)
        return link_list
|
||||
|
||||
# Script entry: scrape the 2010-2012 season pages and dump the collected links.
old_stats = Old_Stats()

# Call form of print: identical output on Python 2 for a single argument, and
# valid syntax on Python 3 (the bare print statement is not).
print(old_stats.get_box_score_links())
|
Loading…
Add table
Reference in a new issue