diff --git a/.circleci/config.yml b/.circleci/config.yml new file mode 100644 index 00000000..1ab1287e --- /dev/null +++ b/.circleci/config.yml @@ -0,0 +1,40 @@ +version: 2.1 + +orbs: + python: circleci/python@1.3.2 + docker: circleci/docker@1.5.0 + +jobs: + build-and-test: + executor: python/default + environment: + TEST: True + steps: + - checkout + - setup_remote_docker + - docker/install-docker-compose + - run: + command: | + python -m pip install --upgrade pip + pip install pylint + pip install -r requirements.txt + pip install scrapy-autounit + name: Install dependencies + - run: + command: | + scrapy crawl espn-live + scrapy crawl espn-players + python3 -m unittest discover autounit/tests/ + name: Crawler Test with autounit + - run: + command: | + pylint app -E + pylint app --exit-zero + name: Lint with pylint + - run: + name: Test with pytest + command: sudo docker-compose -f docker/docker-compose-test.yaml up --build --exit-code-from test +workflows: + main: + jobs: + - build-and-test diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml deleted file mode 100644 index dc6b1694..00000000 --- a/.github/workflows/python-app.yml +++ /dev/null @@ -1,38 +0,0 @@ -# This workflow will install Python dependencies, run tests and lint with a single version of Python -# For more information see: https://help.github.com/actions/language-and-framework-guides/using-python-with-github-actions - -name: Python application - -on: - push: - branches: [ master , 'feature-*'] - pull_request: - branches: [ master , 'feature-*'] - -jobs: - build: - strategy: - matrix: - platform: [ubuntu-latest, windows-latest, macos-latest] - runs-on: ${{ matrix.platform }} - - steps: - - uses: actions/checkout@v2 - - name: Set up Python 3.8 - uses: actions/setup-python@v2 - with: - python-version: 3.8 - - name: Install dependencies - run: | - python -m pip install --upgrade pip - pip install pylint pytest - pip install -r requirements.txt - - name: Lint with pylint - run: | - # stop the build if there are Python syntax errors or undefined names - pylint app -E - # exit-zero treats all errors as warnings. The GitHub editor is 127 chars wide - pylint app --exit-zero - - name: Test with pytest - run: | - pytest diff --git a/.gitignore b/.gitignore index 1b77d315..0d9261e0 100644 --- a/.gitignore +++ b/.gitignore @@ -67,6 +67,7 @@ instance/ # Scrapy stuff: .scrapy +autounit # Sphinx documentation docs/_build/ diff --git a/Dockerfile.development b/Dockerfile.development deleted file mode 100644 index 3396e521..00000000 --- a/Dockerfile.development +++ /dev/null @@ -1,16 +0,0 @@ - -FROM python:3.8-slim as build - -WORKDIR / - -COPY ./requirements.txt ./requirements.txt -RUN apt-get update && \ - apt-get -y install gcc mono-mcs && \ - rm -rf /var/lib/apt/lists/* -RUN pip install -r requirements.txt - -COPY ./app /app -COPY ./crawler /crawler -COPY ./scrapy.cfg /scrapy.cfg - -ENTRYPOINT ["uvicorn", "app.main:app"] \ No newline at end of file diff --git a/README.md b/README.md old mode 100644 new mode 100755 index 1c750ad8..d15428e2 --- a/README.md +++ b/README.md @@ -8,7 +8,7 @@ In the past year or so fantasy cricket has been getting a lot of traction and wi 1. [FastAPI](https://fastapi.tiangolo.com/) 2. [sklearn](https://scikit-learn.org/stable/) -3. [pycricbuzz](https://github.com/codophobia/pycricbuzz) +3. [scrapyrt](https://scrapyrt.readthedocs.io/en/stable/) 4. [scrapy](https://docs.scrapy.org/en/latest/) Install using
@@ -16,7 +16,7 @@ Install using
pip3 install -r requirements.txt ``` -## I want to run your project +## Local Development To run our project follow these steps @@ -27,24 +27,57 @@ To run our project follow these steps cd Best11-Fantasycricket ``` -3. Run the model : +3. + **Linux and MACOS** + + 1. Type `nano /etc/hosts` on your terminal or open `/etc/hosts` on your prefered editor + + **Windows** + 1. Open `C:\windows\system32\drivers\etc\hosts` in your prefered editor + + + 2. And add the below line to the the file and save + + `127.0.0.1 espncricinfo` + + **OR** + + 1. Open `app/fantasy_cricket/scrapyrt_client.py` in your prefered editor + + 2. Change line `16` to + + ```python + self.url = "http://localhost:9080/crawl.json" + ``` + +4. Open a tab on your terminal and run `uvicorn app.main:app` -5. `Open http://localhost:8000/` and voila!! +5. Open another tab on your terminal and run + +`scrapyrt` + + +6. Open `http://localhost:8000/` and voila!! + +**Note:** +Visit `http://localhost:9080/crawl.json` with the correct queries to see the crawler api ### Docker 1. Follow the steps: - ```bash - docker build -t best11fantasycricket:latest "." - ``` ```bash - docker-compose up + docker build -t espncricinfo:latest "." -f docker/espncricinfo/Dockerfile + docker build -t best11:latest "." -f docker/11tastic/Dockerfile + docker-compose -f docker/docker-compose.yaml up ``` -2. Visit `http://localhost:8080/` +2. Visit `http://localhost:8080/` to see the website in action + +**Note** + Visit `http://localhost:9080/crawl.json` with the correct queries to see the crawler api ## How do I contribute to this project???? @@ -69,9 +102,9 @@ If you have any questions regarding our project , you can contact any of the mai ### Acknowledgements -1. Special thanks to [scientes](https://github.com/scientes) for setting up the basic webcrawler +1. Special thanks to [scientes](https://github.com/scientes) for allowing us to use the server to host the website -2. We would like to thank [Howstat](http://www.howstat.com/cricket/home.asp) for their amazing website with daily updates and availabilty to scrape +2. We would like to thank [espncricinfo](https://www.espncricinfo.com/) for their amazing website with daily updates and availabilty to scrape If you liked our project we would really appreciate you starring this repo. diff --git a/app/__init__.py b/app/__init__.py old mode 100644 new mode 100755 diff --git a/app/fantasy_cricket/__init__.py b/app/fantasy_cricket/__init__.py old mode 100644 new mode 100755 diff --git a/app/fantasy_cricket/data/flags.json b/app/fantasy_cricket/data/flags.json deleted file mode 100644 index 91df0982..00000000 --- a/app/fantasy_cricket/data/flags.json +++ /dev/null @@ -1,37 +0,0 @@ -{ - "countries": { - "India": { - "flag": "" - }, - "England": { - "flag": "" - }, - "Australia": { - "flag": "" - }, - "Bangladesh": { - "flag": "" - }, - "New Zealand": { - "flag": "" - }, - "South Africa": { - "flag": "" - }, - "West Indies": { - "flag": "" - }, - "Pakistan": { - "flag": "" - }, - "Ireland": { - "flag": "" - }, - "Afghanistan": { - "flag": "" - }, - "Sri Lanka": { - "flag": "" - } - } -} \ No newline at end of file diff --git a/app/fantasy_cricket/fantasy_leagues.py b/app/fantasy_cricket/fantasy_leagues.py new file mode 100644 index 00000000..7409a656 --- /dev/null +++ b/app/fantasy_cricket/fantasy_leagues.py @@ -0,0 +1,37 @@ +"""This module defines all supported fantasy_leagues and their functionality. +All browsers must inherit from app.fantasy_cricket.Team`. +""" +from app.fantasy_cricket.team import Team + + +class Dream11(Team): + """Dream11 League + + Supported formats: + * ODI + * T20 + * TEST + """ + + name = "Dream11" + + batting_dict = { + "runs": [1, 1, 1], + "boundaries": [1, 1, 1], + "sixes": [2, 2, 2], + "50": [4, 4, 8], + "100": [8, 8, 16], + "duck": [-4, -3, -2], + } + + bowling_dict = { + "wicket": [16, 25, 25], + "4-wicket-haul": [4, 4, 8], + "5-wicket-haul": [8, 8, 16], + "Maiden": [0, 8, 4], + } + + wk_dict = { + "Catch": [8, 8, 8], + "Stump": [12, 12, 12], + } diff --git a/app/fantasy_cricket/matches.py b/app/fantasy_cricket/matches.py new file mode 100755 index 00000000..f2383287 --- /dev/null +++ b/app/fantasy_cricket/matches.py @@ -0,0 +1,56 @@ +""" +The module is defined to get upcoming match data of the next 2 days +""" + +from typing import List +from app.fantasy_cricket.scrapyrt_client import EspnClient + + +class Matches: + """ + A class to get upcoming live match data of the next 2 days + + """ + + def __init__(self) -> None: + + self.espn = EspnClient() + + def get_upcoming_match(self): + """ + Gets current matches dict + """ + matches = [] + for match in self.espn.get_upcoming_dets(): + if match["team1_squad"] != [] and match["team2_squad"] != []: + matches.append( + { + "team1": match["team1"], + "team2": match["team2"], + "flag_team1": "https://a.espncdn.com/i/teamlogos/cricket/500/" + + match["team1_id"] + + ".png", + "flag_team2": "https://a.espncdn.com/i/teamlogos/cricket/500/" + + match["team2_id"] + + ".png", + } + ) + + return matches + + def get_squad_match_type(self, teams: List[str]): + """ + Gets squad and match_class based on teams + """ + + for match in self.espn.get_upcoming_dets(): + + if match["team1"] == teams[0] and match["team2"] == teams[1]: + match_det = { + "team1_squad": match["team1_squad"], + "team2_squad": match["team2_squad"], + "match_type": match["match_id"], + } + break + + return match_det diff --git a/app/fantasy_cricket/scrapyrt_client.py b/app/fantasy_cricket/scrapyrt_client.py new file mode 100755 index 00000000..4091466c --- /dev/null +++ b/app/fantasy_cricket/scrapyrt_client.py @@ -0,0 +1,112 @@ +""" +This module is built as an api wrapper around the scrapyrt process +""" + +from typing import List +import requests + + +class EspnClient: + """ + A simple wrapper built on the scrapyrt api process + """ + + def __init__(self) -> None: + + self.url = "http://espncricinfo:9080/crawl.json" + + def get_upcoming_dets(self): + """ + Gets the upcoming matches from the scrapyrt api + """ + matches = requests.get( + self.url, params={"spider_name": "espn-live", "start_requests": "true"} + ) + + return matches.json()["items"] + + def get_player_dets(self, players: List[str], team: str): + """ + Gets and parses player info from the scrapyrt api + """ + player_data = [] + for player in players: + player_data.append( + ( + requests.get( + self.url, + params={ + "spider_name": "espn-players", + "url": "https://www.espncricinfo.com/ci/content/player/" + + str(player) + + ".html", + }, + ).json()["items"][0], + player, + ) + ) + for player, player_id in player_data: + if not player["role"]: + continue + if "wicketkeeper" in player["role"].lower(): + player["role"] = "wicket-keeper" + elif "allrounder" in player["role"].lower(): + player["role"] = "all-rounder" + elif "bowler" in player["role"].lower(): + player["role"] = "bowler" + else: + player["role"] = "batsman" + player["team"] = team + player["player_id"] = player_id + + player_data = [player for player, _ in player_data if player["role"]] + return player_data + + def get_match_det(self, player_id: str, role: str, match_type: str): + """ + Gets and parses match details got fr0om the scrapyrt api + """ + role_filter_dict = { + "batsman": ["Catch", "Stump", "wicket", "Maiden"], + "bowler": ["Catch", "Stump", "runs", "boundaries", "sixes"], + "all-rounder": ["Catch", "Stump"], + "wicket-keeper": ["wicket", "Maiden"], + } + match_det = requests.get( + self.url, + params={ + "spider_name": "espn-matches", + "url": "https://stats.espncricinfo.com/ci/engine/player/" + + player_id + + ".html?class=" + + match_type + + ";orderby=start;orderbyad=reverse;template=results;type=allround;view=match", + }, + ).json()["items"] + for i, _ in enumerate(match_det): + match_det[i] = { + key: val + for key, val in match_det[i].items() + if key not in role_filter_dict[role] + } + if role in ["batsman", "all-rounder", "wicket-keeper"]: + match_det[i]["100"] = match_det[i]["50"] = match_det[i]["duck"] = 0 + if not match_det[i]["runs"]: + match_det[i]["runs"] = match_det[i]["boundaries"] = match_det[i][ + "sixes" + ] = 0 + elif match_det[i]["runs"] >= 100: + match_det[i]["100"] = 1 + elif match_det[i]["runs"] >= 50: + match_det[i]["50"] = 1 + elif match_det[i]["runs"] == 0: + match_det[i]["duck"] = 1 + if role in ["bowler", "all-rounder"]: + match_det[i]["4-wicket-haul"] = match_det[i]["5-wicket-haul"] = 0 + if not match_det[i]["wicket"]: + match_det[i]["wicket"] = match_det[i]["Maiden"] = 0 + elif match_det[i]["wicket"] >= 5: + match_det[i]["5-wicket-haul"] = 1 + elif match_det[i]["wicket"] >= 4: + match_det[i]["4-wicket-haul"] = 1 + return match_det diff --git a/app/fantasy_cricket/static/bat.png b/app/fantasy_cricket/static/bat.png deleted file mode 100644 index 4a495fb6..00000000 Binary files a/app/fantasy_cricket/static/bat.png and /dev/null differ diff --git a/app/fantasy_cricket/static/fonts/hackerspace.ttf b/app/fantasy_cricket/static/fonts/hackerspace.ttf old mode 100644 new mode 100755 diff --git a/app/fantasy_cricket/static/icon.png b/app/fantasy_cricket/static/icon.png deleted file mode 100644 index a81e1258..00000000 Binary files a/app/fantasy_cricket/static/icon.png and /dev/null differ diff --git a/app/fantasy_cricket/static/loading.gif b/app/fantasy_cricket/static/loading.gif deleted file mode 100644 index 05e1f570..00000000 Binary files a/app/fantasy_cricket/static/loading.gif and /dev/null differ diff --git a/app/fantasy_cricket/static/result1.jpg b/app/fantasy_cricket/static/result1.jpg deleted file mode 100644 index 98f91ca3..00000000 Binary files a/app/fantasy_cricket/static/result1.jpg and /dev/null differ diff --git a/app/fantasy_cricket/static/styles/style.css b/app/fantasy_cricket/static/styles/style.css deleted file mode 100644 index fb294015..00000000 --- a/app/fantasy_cricket/static/styles/style.css +++ /dev/null @@ -1,73 +0,0 @@ -/* This following style sheet is not being used */ -body { - background-image: url("../images/background1.jpg"); -} - -h1 { - text-align: center; - color: white; - font-size: 3em; - margin-top: 2.5em; -} - -h2 { - text-align: center; - color: white; - font-size: 2em; - margin-top: 3em; -} - -form { - margin-top: 1em; - margin-left: 4.5em; -} - -input { - position: absolute; - left: 44%; - border-radius: 5px; - border: 1px solid; - padding: 8px 6px; - line-height: 120%; -} - -.container { - display: grid; - grid-template-columns: auto auto auto auto; - grid-gap: 10px; - grid-row-gap: 40px; - padding: 10px; -} - -input:hover[type="submit"] { - color: white; - box-shadow: 0 5px 15px rgba(145, 92, 182, .4); -} - -.button { - position: absolute; - top: 450px; - left: 710px; -} - -p { - text-align: center; -} - -.custom-select { - width:200px; - position: absolute; - left: 43.5%; - text-align: center; - margin-top: 1.5em; -} - -select { - height:30px; - text-align: center; - border-radius: 3px; - font-family: Arial; - line-height:30px; - font-size: 1em; -} - diff --git a/app/fantasy_cricket/static/styles/style1.css b/app/fantasy_cricket/static/styles/style1.css old mode 100644 new mode 100755 index c714e50c..9e6516ba --- a/app/fantasy_cricket/static/styles/style1.css +++ b/app/fantasy_cricket/static/styles/style1.css @@ -1,5 +1,5 @@ .bgImage { - background-image: url("../result1.jpg") ; + background-image: url("https://user-images.githubusercontent.com/54945757/106836486-448fe600-66bf-11eb-9878-bb8e2237dd91.jpg") ; background-size:cover; position: fixed; left: 0; diff --git a/app/fantasy_cricket/static/styles/style2.css b/app/fantasy_cricket/static/styles/style2.css old mode 100644 new mode 100755 diff --git a/app/fantasy_cricket/team.py b/app/fantasy_cricket/team.py old mode 100644 new mode 100755 index 7587ebea..2135f474 --- a/app/fantasy_cricket/team.py +++ b/app/fantasy_cricket/team.py @@ -1,218 +1,124 @@ """ -This module defines the teams class which outputs the team for the match -and the Predict class which predicts the score based on the role -Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . +This module defines the teams class which is generic over the classes in fantasy_leagues module """ -import json +from typing import List, Optional import numpy as np from sklearn.linear_model import LinearRegression +from app.fantasy_cricket.scrapyrt_client import EspnClient -class Teams: - """A team class which is defined as a base in predicting teams - * **get_match** : a dictionary which maps the match_id of the selected match - to the match name - * **match_id**: match_id of the match chosen by the user - * **match**: Match name of the selected match_id - * **team_dict**: dictionary which maps the team name to count of the players - selected from that team - *param Id: Id passed to select team for a match +class Team: + """ + A generic class built over the league classes in fantasy_leagues.py """ - def __init__(self, path): - self.path = path - self.team_dict = {} - self.player = {} - self.data = {} + name: Optional[str] = None - def get_max_players(self, role_dict, role): - """ - Returns max player for a particular role - :param role_dict : dict of the players mapped to the score for that role - :type dict( str : float) - :param player : dictionary of the selected players for the best11 - :type dict( str: float) - :param role : role of the player - :type str - :rtype: dict( str: float) - """ - if role_dict != {}: - max_score = { - "wk": [list(role_dict.keys())[0]], - "all": [list(role_dict.keys())[0]], - "bat": list(role_dict.keys())[:3], - "bowl": list(role_dict.keys())[:3], - } - team1,team2 = self.team_dict.keys() - names = max_score[role] - for name in names: - if team1 in role_dict[name]["team"]: - self.team_dict[team1] += 1 - elif team2 in role_dict[name]["team"]: - self.team_dict[team2] += 1 - if name not in self.player: - self.player[name] = role_dict[name] - - def get_restofteam(self, role_dict, reduntant, restteam): - """ - Returns the rest of the players who have not yet been chosen for the 11 - :param role_dict : dict of the players mapped to the score for that role - :type dict( str : float) - :param player : dictionary of the selected players for the best11 - :type dict( str: float) - :param redundant : selected players - :type list(str) - :param restteam: dict of the players left to be selected - :type dict( str: float) - :rtype dict( str: float) - """ - for i in role_dict: - if i not in self.player and i not in reduntant: - restteam[i] = role_dict[i] + batting_dict = {} + bowling_dict = {} + wk_dict = {} - restteam = sorted(restteam.items(), key=lambda x: x[1]["score"], reverse=True) - restteam = {i[0]: i[1] for i in restteam} - return restteam + def __init__(self, team1: str, team2: str) -> None: - def get_captain(self): - """ - Returns Captain and Vice Captain for the selected 11 - :param player: dictionary of the selected players for the best11 - :type dict( str : float) - :rtype: tuple(str,str) - """ - self.player = [ - i[0] - for i in sorted( - self.player.items(), key=lambda x: x[1]["score"], reverse=True - ) - ] - captain, vcaptain = self.player[0], self.player[1] - return captain, vcaptain + self.fantasy_team = {team1: [], team2: []} + self.team1 = team1 + self.team2 = team2 + self.espn = EspnClient() - def team(self): + def get_fantasy_team(self): """ - Returns Captain,Vicecaptain and teams for each role - :rtype: tuple( - str, - str, - dict( str : float), - dict( str : float), - dict( str : float), - dict( str : float), - ) + Get the fantasy team predicted including captains """ + vice_captain, captain = self.get_captain_vicecaptain() + for player in self.fantasy_team[self.team1] + self.fantasy_team[self.team2]: + if player == captain: + player["captain"] = "(C)" + elif player == vice_captain: + player["captain"] = "(VC)" + else: + player["captain"] = "" + return self.fantasy_team[self.team1] + self.fantasy_team[self.team2] - self.data = json.load(open(self.path)) - wkteam = batteam = ballteam = allteam = None - position_map = { - "wk": {"var": wkteam}, - "bat": {"var": batteam}, - "bowl": {"var": ballteam}, - "all": {"var": allteam}, - } - for role in position_map: - role_data = dict() - for player in self.data.keys(): - if self.data[player]["team"] not in self.team_dict.keys(): - self.team_dict[self.data[player]["team"]] = 0 - if self.data[player]["role"] == role: - role_data[player] = self.data[player] - position_map[role]["var"] = get_role_team(role_data) - self.get_max_players(position_map[role]["var"], role) - - count = 0 - redundant = [] - # print(position_map,self.team_dict) - maxi = len(self.player) - while count < 11 - maxi: - print(count) - restteam = {} - for role in position_map: - restteam = self.get_restofteam( - position_map[role]["var"], redundant, restteam - ) - new = list(restteam.keys())[0] - if list(self.team_dict.keys())[0] in restteam[new]["team"]: - if self.team_dict[list(self.team_dict.keys())[0]] < 7: - self.player[new] = restteam[new] - count += 1 - self.team_dict[list(self.team_dict.keys())[0]] += 1 - else: - redundant.append(new) - elif list(self.team_dict.keys())[1] in restteam[new]["team"]: - if self.team_dict[list(self.team_dict.keys())[1]] < 7: - self.player[new] = restteam[new] - count += 1 - self.team_dict[list(self.team_dict.keys())[1]] += 1 - else: - redundant.append(new) - # print(self.player) - return self.get_captain() - - -class Predict: - """ - A Predict class which predicts the score of the teams - * **value** : Number of matches to consider so as to predict the next match score - * **date** : Date the match to be predicted is going to be played - * **dates** : Dataframe of dates of all matches played by the player - :type : pandas.DataFrame() - * **result**: predicted score - * **player_name** : file name corresponding to the player name - :param : player : player name - :type : str - :param : role : player role - :type : str - :param : date : Date of the match - : type : str - """ - - value = 5 - - def __init__(self, player, data): - self.data = data - scores = self.get_scores(player) - self.result = self.predict(scores) - - def get_scores(self, player): + def get_captain_vicecaptain(self): """ - Returns scores in chronological order - :param : player : Player name - :type : String - rtype : list + Get captains and vice captains only """ - scores = self.data[player]["scores"] - scores = sorted(scores.items(), key=lambda x: x[0]) - scores = [i[1] for i in scores] - return scores + return sorted( + self.fantasy_team[self.team1] + self.fantasy_team[self.team2], + key=lambda i: i["score"], + )[-2:] - def predict(self, scores): + def get_score(self, role: str, match_type: str, score_info) -> float: """ - Returns the predicted score - :param : scores : A numpy array with the scores of all matches the - player has played - :type : numpy.array() - :rtype : float + Function to predict the fantasy league score of each player """ - + player_scores = {} + for score_data in score_info: + if role == "batsman": + player_scores[score_data["match_id"]] = sum( + self.batting_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key != "match_id" + ) + elif role == "bowler": + player_scores[score_data["match_id"]] = sum( + self.bowling_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key != "match_id" + ) + elif role == "all-rounder": + player_scores[score_data["match_id"]] = sum( + self.batting_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key + not in [ + "match_id", + "wicket", + "Maiden", + "4-wicket-haul", + "5-wicket-haul", + ] + ) + sum( + self.bowling_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key + not in [ + "match_id", + "runs", + "boundaries", + "sixes", + "100", + "50", + "duck", + ] + ) + elif role == "wicket-keeper": + player_scores[score_data["match_id"]] = sum( + self.batting_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key not in ["match_id", "Catch", "Stump"] + ) + sum( + self.wk_dict[key][int(match_type) - 1] * int(score_data[key]) + for key in score_data + if key + not in [ + "match_id", + "runs", + "boundaries", + "sixes", + "100", + "50", + "duck", + ] + ) + scores = [player_scores[k] for k in sorted(player_scores)] regr = LinearRegression(fit_intercept=True) - y_train = np.array(scores[len(scores) - self.value :]).reshape(-1, 1) - x_train = np.array(range(self.value)).reshape(-1, 1) + y_train = np.array(scores).reshape(-1, 1) + x_train = np.array(range(5)).reshape(-1, 1) try: regr.fit(x_train, y_train) - pred = regr.predict(np.array(self.value).reshape(1, -1)) + pred = regr.predict(np.array(5).reshape(1, -1)) if pred[0][0] < 0: result = 0 else: @@ -221,28 +127,74 @@ def predict(self, scores): result = -1 return result + def get_min_team(self, players): + """ + Gets the min team as per the fantasy league + """ + role_score_map = { + "batsman": sorted( + [player for player in players if player["role"] == "batsman"], + key=lambda i: i["score"], + )[-3:], + "bowler": sorted( + [player for player in players if player["role"] == "bowler"], + key=lambda i: i["score"], + )[-3:], + "all-rounder": sorted( + [player for player in players if player["role"] == "all-rounder"], + key=lambda i: i["score"], + reverse=True, + )[0:1], + "wicket-keeper": sorted( + [player for player in players if player["role"] == "wicket-keeper"], + key=lambda i: i["score"], + reverse=True, + )[:1], + } -def get_role_team(data): - """ - Returns the player names and score corresponding to a role - from the files dataframe - :param role : role of the players in the dataframe - :type str - :param role_data : dataframe of the list of players and files - :type pandas.DataFrame() - :param file_name : file name of the match - :type str - :rtype: dict(str: float) - """ - - team = {} + for role in role_score_map: + for player in role_score_map[role]: + if player["team"] == self.team1: + self.fantasy_team[self.team1].append(player) + elif player["team"] == self.team2: + self.fantasy_team[self.team2].append(player) - for player_det in data.keys(): - if player_det not in team: - team[player_det] = {} - team[player_det]["score"] = Predict(player_det, data).result - team[player_det]["team"] = data[player_det]["team"] - wkt = sorted(team.items(), key=lambda x: x[1]["score"], reverse=True) - wkteam = {i[0]: i[1] for i in wkt} + return self.fantasy_team[self.team1] + self.fantasy_team[self.team2] - return wkteam + def fetch_fantasy_team( + self, player_team1: List[str], player_team2: List[str], match_type: str + ): + """ + Builds the fantasy Team + """ + players = self.espn.get_player_dets(player_team1, self.team1) + players += self.espn.get_player_dets(player_team2, self.team2) + remove = [] + for player in players: + score_info = self.espn.get_match_det( + player["player_id"], player["role"], match_type + ) + if len(score_info) == 5: + player["score"] = self.get_score(player["role"], match_type, score_info) + else: + remove.append(player) + + for player in remove: + players.remove(player) + + remove = self.get_min_team(players) + + for player in remove: + players.remove(player) + + for player in sorted(players, key=lambda i: i["score"]): + if ( + len(self.fantasy_team[self.team1]) + len(self.fantasy_team[self.team2]) + ) == 11: + break + if player["team"] == self.team1: + if len(self.fantasy_team[self.team1]) != 7: + self.fantasy_team[self.team1].append(player) + elif player["team"] == self.team2: + if len(self.fantasy_team[self.team2]) != 7: + self.fantasy_team[self.team2].append(player) diff --git a/app/fantasy_cricket/templates/Playing_11.html b/app/fantasy_cricket/templates/Playing_11.html old mode 100644 new mode 100755 index 5647a46c..2be75cbb --- a/app/fantasy_cricket/templates/Playing_11.html +++ b/app/fantasy_cricket/templates/Playing_11.html @@ -1,25 +1,10 @@ - Choose your playing 11 - + Select 11 Players From Each Team

-
+
@@ -45,10 +30,10 @@

{% for player in squads[0] %} - {{player}} + {{player['name']}} - + {% endfor %} @@ -66,10 +51,10 @@

{% for player in squads[1] %} - {{player}} + {{player['name']}} - + {% endfor %} @@ -85,7 +70,7 @@

- Loading + Loading

Loading....

diff --git a/app/fantasy_cricket/templates/index.html b/app/fantasy_cricket/templates/index.html old mode 100644 new mode 100755 index 5340b9d4..520fc272 --- a/app/fantasy_cricket/templates/index.html +++ b/app/fantasy_cricket/templates/index.html @@ -1,19 +1,4 @@ - @@ -24,13 +9,12 @@ - Fantasy-cricket Prediction - + - + Results Page @@ -48,140 +33,29 @@

Your Recommended Team

- - - -
-
-
- -
{{ t6 }}{{ c6 }}{{ v6 }}
-
-
-
- -
{{ t7 }}{{ c7 }}{{ v7 }}
-
-
-
- -
{{ t8 }}{{ c8 }}{{ v8 }}
-
-
-
- -
{{ t9 }}{{ c9 }}{{ v9 }}
-
-
-
- -
{{ t10 }}{{ c10 }}{{ v10 }}
-
+

+ {% for player in team[5:] %}
-
{{ t11 }}{{ c11 }}{{ v11 }}
+
{{ player["name"] }}{{ player["captain"] }}
+ {% endfor %}
- -
+ {% for player in team[0:5] %}
-
{{ t1 }}{{ c1 }}{{ v1 }}
-
-
-
- -
{{ t2 }}{{ c2 }}{{ v2 }}
-
-
- -
{{ t3 }}{{ c3 }}{{ v3 }}
-
-
-
- -
{{ t4 }}{{ c4 }}{{ v4 }}
-
-
-
- -
{{ t5 }}{{ c5 }}{{ v5 }}
+
{{ player["name"] }}{{ player["captain"] }}
+ + {% endfor %}
diff --git a/app/fantasy_cricket/utils.py b/app/fantasy_cricket/utils.py deleted file mode 100644 index 207bf642..00000000 --- a/app/fantasy_cricket/utils.py +++ /dev/null @@ -1,92 +0,0 @@ -""" -Module which helps to get current match data -Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. -- - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" - -import json -from pycricbuzz import Cricbuzz - - -class Matches: - """ - Class which gets and parses matches within 24 hours period - """ - - def __init__(self): - """ - cricket: class of cricbuzz - supported teams: supported teams by our module - flags: flags json with links - """ - - self.cricket = Cricbuzz() - - self.supported_teams = [ - "India", - "Australia", - "New Zealand", - "England", - "Bangladesh", - "South Africa", - "West Indies", - "Pakistan", - "Afghanistan", - "Sri Lanka", - ] - with open("app/fantasy_cricket/data/flags.json") as flag_file: - self.flags = json.load(flag_file) - - def get_match(self): - """ - Gets current matches dict - """ - matches = [] - for match in self.cricket.matches(): - - if ( - match["team1"]["name"] in self.supported_teams - and match["team2"]["name"] in self.supported_teams - #and match["mchstate"] == "preview" - ): - matches.append( - ( - match["team1"], - match["team2"], - self.flags["countries"][match["team1"]["name"]], - self.flags["countries"][match["team2"]["name"]], - ) - ) - return matches - - def get_squad_file_match_type(self, teams): - """ - Gets squad file based on teams - """ - - for match in self.cricket.matches(): - - if ( - match["team1"]["name"] == teams[0] - and match["team2"]["name"] == teams[1] - ): - match_det = ( - match["team1"]["squad_bench"] + match["team1"]["squad"], - match["team2"]["squad_bench"] + match["team2"]["squad"], - match["srs"] + match["mnum"], - match["type"] - ) - break - return match_det diff --git a/app/main.py b/app/main.py old mode 100644 new mode 100755 index 35e7fb4d..43efaab8 --- a/app/main.py +++ b/app/main.py @@ -16,14 +16,14 @@ along with this program. If not, see . """ -import os +from typing import List from fastapi.templating import Jinja2Templates from fastapi.responses import HTMLResponse, RedirectResponse, FileResponse -from fastapi import FastAPI, Form, Request, status +from fastapi import FastAPI, Form, Request, status, Query from fastapi.staticfiles import StaticFiles from fastapi.encoders import jsonable_encoder -from app.fantasy_cricket.team import Teams -from app.fantasy_cricket.utils import Matches +from app.fantasy_cricket.fantasy_leagues import Dream11 +from app.fantasy_cricket.matches import Matches # pylint: disable=missing-function-docstring # pylint: disable=global-variable-undefined @@ -41,18 +41,15 @@ @app.get("/", response_class=HTMLResponse) def home(request: Request): - matches = cricket.get_match() - teams = [ - [match[0]["name"], match[1]["name"], match[2]["flag"], match[3]["flag"]] - for match in matches - ] + matches = cricket.get_upcoming_match() return templates.TemplateResponse( - "index.html", {"request": request, "teams": teams} + "index.html", {"request": request, "teams": matches} ) @app.post("/") -async def home_post(match: str = Form(...)): +def home_post(match: str = Form(...)): + response = RedirectResponse( url="/playing11?team1=" + match.split(" vs ")[0] @@ -64,106 +61,56 @@ async def home_post(match: str = Form(...)): @app.get("/playing11", response_class=HTMLResponse) -def playing_11(request: Request, team1, team2): - - squad1, squad2, file, match_type = cricket.get_squad_file_match_type([team1, team2]) +def playing_11(request: Request, team1: str = Query(...), team2: str = Query(...)): + match_data = cricket.get_squad_match_type([team1, team2]) return templates.TemplateResponse( "Playing_11.html", { "request": request, - "squads": [squad1, squad2], - "file": file, - "match_type": match_type, + "squads": [match_data["team1_squad"], match_data["team2_squad"]], + "match_type": match_data["match_type"], "teams": [team1, team2], }, ) @app.post("/playing11") -async def playing_11_post(request: Request, file, match_type, team1, team2): - playings_11 = list(jsonable_encoder(await request.form()).keys()) - playings_11.remove("Confirm") - players1 = '"' + '","'.join(playings_11[0:11]) + '"' - players2 = '"' + '","'.join(playings_11[11:]) + '"' - - scrape_with_crochet( - file=file, - match_type=match_type, - teams=[team1, team2], - players2=players2, - players1=players1, - ) - return RedirectResponse( - url="/results?file=" + file, status_code=status.HTTP_302_FOUND +async def playing_11_post( + request: Request, + team1: str = Query(...), + team2: str = Query(...), + match_type: str = Query(...), +): + + play_11 = list(jsonable_encoder(await request.form()).keys()) + play_11.remove("Confirm") + url = ( + "/results/?match_type=" + match_type + "&team=" + team1 + "&team=" + team2 + "&" ) + for player in play_11[0:11]: + url += "player_team1=" + player + "&" + for player in play_11[11:]: + url += "player_team2=" + player + "&" + return RedirectResponse(url=url[:-1], status_code=status.HTTP_302_FOUND) @app.get("/results", response_class=HTMLResponse) -def result(request: Request, file): - t_d = Teams("app/fantasy_cricket/data/" + file + ".json") - captain, vcaptain = t_d.team() - team_list = t_d.player - players = [] - for i in team_list: - if i == captain: - tag_c = "(C)" - elif i == vcaptain: - tag_c = "(VC)" - else: - tag_c = "" - players.append(i + tag_c) - captain_list = [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0] - vcaptain_list = [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0] - for i, _ in enumerate(players): - if "(C)" in players[i]: - captain_list[i] = "(C)" - vcaptain_list[i] = "" - players[i] = players[i][:-3] - elif "(VC)" in players[i]: - vcaptain_list[i] = "(VC)" - captain_list[i] = "" - players[i] = players[i][:-4] - else: - vcaptain_list[i] = "" - captain_list[i] = "" +def result( + request: Request, + team: List[str] = Query(...), + match_type: str = Query(...), + player_team1: List[str] = Query(...), + player_team2: List[str] = Query(...), +): + t_d = Dream11(team[0], team[1]) + t_d.fetch_fantasy_team(player_team1, player_team2, match_type) + team = t_d.get_fantasy_team() return templates.TemplateResponse( "result.html", - context={ + { "request": request, - "c1": captain_list[0], - "v1": vcaptain_list[0], - "t1": players[0], - "c2": captain_list[1], - "v2": vcaptain_list[1], - "t2": players[1], - "c3": captain_list[2], - "v3": vcaptain_list[2], - "t3": players[2], - "c4": captain_list[3], - "v4": vcaptain_list[3], - "t4": players[3], - "c5": captain_list[4], - "v5": vcaptain_list[4], - "t5": players[4], - "c6": captain_list[5], - "v6": vcaptain_list[5], - "t6": players[5], - "c7": captain_list[6], - "v7": vcaptain_list[6], - "t7": players[6], - "c8": captain_list[7], - "v8": vcaptain_list[7], - "t8": players[7], - "c9": captain_list[8], - "v9": vcaptain_list[8], - "t9": players[8], - "c10": captain_list[9], - "v10": vcaptain_list[9], - "t10": players[9], - "c11": captain_list[10], - "v11": vcaptain_list[10], - "t11": players[10], + "team": team, }, ) @@ -171,23 +118,3 @@ def result(request: Request, file): @app.get("/robots.txt") def robots(): return FileResponse("app/robots.txt") - - -def scrape_with_crochet(file, match_type, teams, players1, players2): - - v_open = os.popen( - 'python3 -m scrapy crawl howstat -a match_type="' - + match_type - + '" -a team1="' - + teams[0] - + '" -a team2="' - + teams[1] - + '" -a players1=' - + players1 - + " -a players2=" - + players2 - + ' -a file="' - + file - + '" --loglevel DEBUG', - ) - v_open.close() diff --git a/app/robots.txt b/app/robots.txt old mode 100644 new mode 100755 index ac25b5fa..f7afb9da --- a/app/robots.txt +++ b/app/robots.txt @@ -2,5 +2,5 @@ User-agent: * Allow: / -Disallow: /playing11 -Disallow: /results \ No newline at end of file +Allow: /playing11 +Allow: /results \ No newline at end of file diff --git a/crawler/__init__.py b/crawler/__init__.py deleted file mode 100644 index 13e9dda5..00000000 --- a/crawler/__init__.py +++ /dev/null @@ -1,19 +0,0 @@ -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" -import sys - -sys.path.insert(1, "..") diff --git a/crawler/fantasy_leagues.py b/crawler/fantasy_leagues.py deleted file mode 100644 index 2d985548..00000000 --- a/crawler/fantasy_leagues.py +++ /dev/null @@ -1,88 +0,0 @@ - -""" -This modules defines all the fantasy leagues that -the project supports - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" - - -class Scorer: - """ - Scorer class to use different formats of the game - - :py:class `t20`: A T20 dictionary which contains scoring metrics - :py:class `odi`: A ODI dictionary which contains scoring metrics - :py:class `test`: A TEST dictionary which contains scoring metrics - - :param scoring_dict: A dictionary containing scoring metrics. - Each value represents a list where index 0 represents `T20`, - 1 represents `ODI`, 2 represents `TEST` - """ - - def __init__(self, scoring_dict): - - self.t20 = {key: scoring_dict[key][0] for key in scoring_dict} - self.odi = {key: scoring_dict[key][1] for key in scoring_dict} - self.test = {key: scoring_dict[key][2] for key in scoring_dict} - - def get_score(self, stats, playing_format): - """ - Function which sums the score for that platform - depending on the format of the game - - :param playing_format: One of `ODI`,`T20`,`TEST` - """ - type_map = {"ODI": self.odi, "T20": self.t20, "TEST": self.test} - return sum(type_map[playing_format][key] * stats[key] for key in stats) - - -class Dream11: - """Dream11 League - - Supported platforms: - * ODI - * T20 - * TEST - """ - - name = "Dream11" - - batting_dict = Scorer( - { - "runs": [1, 1, 1], - "boundaries": [1, 1, 1], - "sixes": [2, 2, 2], - "50": [8, 4, 4], - "100": [16, 8, 8], - "duck": [-2, -3, -4], - } - ) - - bowling_dict = Scorer( - { - "wicket": [25, 25, 16], - "4-wicket-haul": [8, 4, 4], - "5-wicket-haul": [16, 8, 8], - "Maiden": [4, 8, 0], - } - ) - - wk_dict = Scorer( - { - "Catch": [8, 8, 8], - "Stump": [12, 12, 12], - } - ) diff --git a/crawler/items.py b/crawler/items.py deleted file mode 100644 index d7374db5..00000000 --- a/crawler/items.py +++ /dev/null @@ -1,41 +0,0 @@ -# Define here the models for your scraped items -# -# See documentation in: -# https://docs.scrapy.org/en/latest/topics/items.html - -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" - - -import scrapy - - -class PlayerItem(scrapy.Item): - """ - Class scrapes name of the player - Role of the player - Score he scored in that game - Team he is playing for - Date of the match - File it has been stored in - """ - name = scrapy.Field() - role = scrapy.Field() - score = scrapy.Field() - team = scrapy.Field() - date = scrapy.Field() - file = scrapy.Field() diff --git a/crawler/pipelines.py b/crawler/pipelines.py deleted file mode 100644 index a210acb1..00000000 --- a/crawler/pipelines.py +++ /dev/null @@ -1,57 +0,0 @@ -# Define your item pipelines here -# -# Don't forget to add your pipeline to the ITEM_PIPELINES setting -# See: https://docs.scrapy.org/en/latest/topics/item-pipeline.html - -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" -# useful for handling different item types with a single interface -import json -from statistics import mode -from itemadapter import ItemAdapter - - -class CricketcrawlerPipeline: - """ - Processes output given by the crawler and stores it in a json file - """ - def open_spider(self, spider): - """ - Works when spider starts crawling - """ - self.items = {} - self.name = None - - def close_spider(self, spider): - """ - Works when the spider stops crawling - """ - for item in self.items: - assert len(self.items[item]["role"]) == 5, f"{item}" - self.items[item]["role"] = mode(self.items[item]["role"]) - with open(self.name, "w") as f_p: - json.dump(self.items, f_p, indent=6) - - def process_item(self, item, spider): - """ - Processes files as the items are yielded - """ - self.name = f'app/fantasy_cricket/data/{item["file"]}.json' - if item["name"] not in self.items: - self.items[item["name"]] = {"role": [], "team": item["team"], "scores": {}} - self.items[item["name"]]["role"].append(item["role"]) - self.items[item["name"]]["scores"][item["date"]] = item["score"] diff --git a/crawler/spiders/__init__.py b/crawler/spiders/__init__.py deleted file mode 100644 index be112f24..00000000 --- a/crawler/spiders/__init__.py +++ /dev/null @@ -1,24 +0,0 @@ -# This package will contain the spiders of your Scrapy project -# -# Please refer to the documentation for information on how to create and manage -# your spiders. -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" - -import sys - -sys.path.insert(1, "..") diff --git a/crawler/spiders/howstat.py b/crawler/spiders/howstat.py deleted file mode 100644 index 4d1b0c5c..00000000 --- a/crawler/spiders/howstat.py +++ /dev/null @@ -1,305 +0,0 @@ -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" -from scrapy import Request, Spider -from crawler.fantasy_leagues import Dream11 -from crawler.items import PlayerItem - - -class HowstatSpider(Spider): - """ - Spider which crawls through howstat.com - """ - name = "howstat" - allowed_domains = ["howstat.com"] - - start_urls = ["http://www.howstat.com/cricket/Statistics/Players/PlayerListCurrent.asp"] - def __init__(self, players1="", players2="", match_type="", *args, **kwargs): - super(HowstatSpider, self).__init__(*args, **kwargs) - self.names = { - "last": {self.team1: [], self.team2: []}, - "first": {self.team1: [], self.team2: []}, - } - for player in players1.split(","): - player_id = player.split() - if ( - player_id[0].lower().strip() == "de" - or player_id[0].lower().strip() == "du" - or player_id[0].lower().strip() == "van" - ): - player_id = [' '.join(player_id)] - if len(player_id) == 1: - self.names["last"][self.team1].append(player_id[0].lower().strip()) - self.names["first"][self.team1].append("") - elif len(player_id) >= 1: - self.names["last"][self.team1].append(player_id[-1].lower().strip()) - self.names["first"][self.team1].append(player_id[0].lower().strip()) - for player in players2.split(","): - player_id = player.split() - if len(player_id) == 1: - self.names["last"][self.team2].append(player_id[0].lower().strip()) - self.names["first"][self.team2].append("") - elif len(player_id) >= 1: - self.names["last"][self.team2].append(player_id[-1].lower().strip()) - self.names["first"][self.team2].append(player_id[0].lower().strip()) - assert ( - len(self.names["last"][self.team1]) - == 11 - == len(self.names["first"][self.team1]) - == len(self.names["first"][self.team2]) - == len(self.names["last"][self.team2]) - ) - if match_type == "TEST": - self.match_type = "" - else: - self.match_type = "_" + match_type - self.matches = {} - self.count = 0 - - def parse(self, response): - """ - Returns a request for the player found in the parsed url - """ - comma_map = { - "India": 1, - "Australia": 1, - "New Zealand": 1, - "England": 1, - "Bangladesh": 0, - "South Africa": 1, - "West Indies": 1, - "Pakistan": 0, - "Afghanistan": 0, - "Sri Lanka": 1, - } - teams = { - self.team1: response.selector.xpath( - "//table[@class='TableLined']/tr[td[3]/text()[contains(.,'" - + self.team1 - + "')]]/td[1]" - ), - self.team2: response.selector.xpath( - "//table[@class='TableLined']/tr[td[3]/text()[contains(.,'" - + self.team2 - + "')]]/td[1]" - ), - } - players = {} - for team in teams: - players[team] = [] - for player in teams[team]: - player_id = player.xpath("a/text()").get() - if comma_map[team]: - player_id = player_id.split(",") - try: - i = self.names["last"][team].index(player_id[0].lower().strip()) - if self.names["first"][team][i] == "": - players[team].append(player.xpath("a")) - else: - for initial in player_id[1].split(): - if ( - self.names["first"][team][i][0].lower() - == initial.lower().strip() - ): - players[team].append(player.xpath("a")) - break - except ValueError: - pass - else: - player_id = (player_id.split()[0], player_id.split()[-1]) - try: - i = self.names["last"][team].index(player_id[1].lower().strip()) - if self.names["first"][team][i] == "": - players[team].append(player.xpath("a")) - else: - if player_id[0].lower().strip() in self.names["first"][team]: - players[team].append(player.xpath("a")) - except ValueError: - pass - for team in players: - for player in players[team]: - player_id = player.xpath("@href").get().split("?")[1] - yield Request( - "http://www.howstat.com/cricket/Statistics/Players/PlayerProgressSummary" - + self.match_type - + ".asp?" - + player_id, - callback=self.parse_last5, - cb_kwargs={"team": team}, - ) - - def parse_last5(self, response, team): - """ - Gets the data of last 5 games for each player - """ - name = ( - response.xpath("//td[contains(@class, 'Banner')]/text()") - .get() - .strip() - .split("(")[0] - .strip() - ) - if self.match_type != "": - matches = response.xpath( - '//table[@class = "TableLined"]/tr[position()>last()-5]/td[2]/a' - ) - else: - matches = response.xpath( - '//table[@class = "TableLined"]/tr[position()>last()-10]/td[2]/a' - ) - crawl = False - if len(matches) >= 5: - crawl = True - matches = matches[len(matches)-5:] - for match in matches: - if crawl: - yield Request( - "http://www.howstat.com/cricket/Statistics" - + match.xpath("@href").get().split("..")[1], - callback=self.parse_scorecard, - cb_kwargs={ - "name": name, - "pid" : response.url.split("?")[-1], - "team" : team, - "date" : match.get().split('>')[1].split('<')[0] - }, - dont_filter=True, - ) - - def parse_scorecard(self, response, name, pid, team, date): - """ - parses the Scorecard - """ - scorelisxpath = ( - "//table/tr/td/table/tr/td/table/tr[td[a[@href[contains(.,'" - + pid - + "')]]]]" - ) - lis = response.selector.xpath(scorelisxpath) - batting_dict = {} - bowling_dict = {} - keeping_dict = {} - role = None - for score in lis: - if score.xpath("td[1]/text()[contains(.,'†')]").get(): - role = "wk" - elif score.xpath("td[2]/text()[contains(.,'.')]"): - if "Maiden" not in bowling_dict: - bowling_dict["Maiden"] = 0 - bowling_dict["Maiden"] += int(score.xpath("td[3]/text()").get().strip()) - if "wicket" not in bowling_dict: - bowling_dict["wicket"] = 0 - bowling_dict["wicket"] += int(score.xpath("td[5]/text()").get().strip()) - if "4-wicket-haul" not in bowling_dict: - bowling_dict["4-wicket-haul"] = 0 - if "5-wicket-haul" not in bowling_dict: - bowling_dict["5-wicket-haul"] = 0 - if int(score.xpath("td[5]/text()").get().strip()) >= 5: - bowling_dict["5-wicket-haul"] += 1 - elif int(score.xpath("td[5]/text()").get().strip()) >= 4: - bowling_dict["4-wicket-haul"] += 1 - else: - current = score - for _ in range(0, 4): - if role == "wk": - break - current = current.xpath("following-sibling::tr") - if current.xpath("td[1][contains(.,'Extras')]"): - role = "bowl" - break - if "runs" not in batting_dict: - batting_dict["runs"] = 0 - if score.xpath("td[3]/text()").get().strip() == "": - batting_dict["runs"] = 0 - batting_dict["boundaries"] = 0 - batting_dict["sixes"] = 0 - batting_dict["50"] = 0 - batting_dict["100"] = 0 - batting_dict["duck"] = 0 - continue - batting_dict["runs"] += int(score.xpath("td[3]/text()").get().strip()) - if "boundaries" not in batting_dict: - batting_dict["boundaries"] = 0 - batting_dict["boundaries"] += int( - score.xpath("td[5]/text()").get().strip() - ) - if "sixes" not in batting_dict: - batting_dict["sixes"] = 0 - batting_dict["sixes"] += int(score.xpath("td[6]/text()").get().strip()) - if "50" not in batting_dict: - batting_dict["50"] = 0 - if "100" not in batting_dict: - batting_dict["100"] = 0 - if "duck" not in batting_dict: - batting_dict["duck"] = 0 - if int(score.xpath("td[3]/text()").get().strip()) >= 100: - batting_dict["100"] += 1 - elif int(score.xpath("td[3]/text()").get().strip()) >= 50: - batting_dict["50"] += 1 - elif ( - int(score.xpath("td[3]/text()").get().strip()) == 50 - and role != "bowl" - ): - batting_dict["duck"] += 1 - if role == "wk": - wk_score = score.xpath( - "//table/tr/td/table/tr/td/table/tr[td[2][@valign and @width]/text()[contains(.,'" - + name.split()[-1].strip() - + "')]]" - ).xpath("td[2]/text()") - if wk_score: - if "Catch" not in keeping_dict: - keeping_dict["Catch"] = 0 - if "Stump" not in keeping_dict: - keeping_dict["Stump"] = 0 - for wk_s in wk_score: - if "c †" in wk_s.get(): - keeping_dict["Catch"] += 1 - elif "st †" in wk_s.get(): - keeping_dict["Stump"] += 1 - - if bowling_dict != {} and role != "bowl": - role = "all" - elif bowling_dict == {} and role != "wk": - role = "bat" - score = 0 - match_type = {"_ODI": "ODI", "_T20": "T20", "": "TEST"} - if role == "wk": - score += Dream11.wk_dict.get_score( - keeping_dict, match_type[self.match_type] - ) - score += Dream11.batting_dict.get_score( - batting_dict, match_type[self.match_type] - ) - elif role == "bowl": - score += Dream11.bowling_dict.get_score( - bowling_dict, match_type[self.match_type] - ) - elif role == "all": - score += Dream11.bowling_dict.get_score( - bowling_dict, match_type[self.match_type] - ) - score += Dream11.batting_dict.get_score( - batting_dict, match_type[self.match_type] - ) - elif role == "bat": - score += Dream11.batting_dict.get_score( - batting_dict, match_type[self.match_type] - ) - - yield PlayerItem( - name=name, score=score, role=role, date=date, team=team, file=self.file - ) diff --git a/Dockerfile b/docker/11tastic/Dockerfile old mode 100644 new mode 100755 similarity index 63% rename from Dockerfile rename to docker/11tastic/Dockerfile index f1cf0de6..c12ff3d0 --- a/Dockerfile +++ b/docker/11tastic/Dockerfile @@ -6,10 +6,4 @@ RUN apt-get update && \ rm -rf /var/lib/apt/lists/* COPY ./requirements.txt /app/requirements.txt RUN pip install --no-cache-dir --user -r /app/requirements.txt; rm -r /tmp - -FROM tiangolo/uvicorn-gunicorn-fastapi:python3.8-slim -COPY --from=compile-image /root/.local /root/.local COPY ./app /app/app -COPY ./crawler /app/crawler -COPY ./scrapy.cfg /app/scrapy.cfg -ENV PYTHONPATH=/app \ No newline at end of file diff --git a/docker/docker-compose-test.yaml b/docker/docker-compose-test.yaml new file mode 100644 index 00000000..8c092e60 --- /dev/null +++ b/docker/docker-compose-test.yaml @@ -0,0 +1,17 @@ +version: '3.3' +services: + espncricinfo: + build: + context: .. + dockerfile: docker/espncricinfo/Dockerfile + ports: + - "9080:9080" + environment: + - LOG_LEVEL=DEBUG + test: + build: + context: .. + dockerfile: docker/test/Dockerfile + depends_on: + - espncricinfo + \ No newline at end of file diff --git a/docker-compose.yaml b/docker/docker-compose.yaml old mode 100644 new mode 100755 similarity index 50% rename from docker-compose.yaml rename to docker/docker-compose.yaml index 3ffde91a..04d3749f --- a/docker-compose.yaml +++ b/docker/docker-compose.yaml @@ -1,14 +1,22 @@ version: '3.3' services: + espncricinfo: + image: espncricinfo:latest + ports: + - "9080:9080" + environment: + - LOG_LEVEL=DEBUG app: - image: best11fantasycricket:latest + image: best11:latest + depends_on: + - espncricinfo ports: - "8080:80" environment: - MAX_WORKERS=1 - - LOG_LEVEL=DEBUG deploy: resources: limits: cpus: '1' - memory: 100M \ No newline at end of file + memory: 100M + \ No newline at end of file diff --git a/docker/espncricinfo/Dockerfile b/docker/espncricinfo/Dockerfile new file mode 100644 index 00000000..d1116f37 --- /dev/null +++ b/docker/espncricinfo/Dockerfile @@ -0,0 +1,11 @@ +FROM python:3 + +WORKDIR /crawler + +RUN pip install --no-cache-dir scrapyrt; rm -r /tmp + +COPY ./espncricinfo /crawler/espncricinfo +COPY ./scrapy.cfg /crawler/scrapy.cfg + +EXPOSE 9080 +CMD ["scrapyrt", "-i", "0.0.0.0"] \ No newline at end of file diff --git a/docker/test/Dockerfile b/docker/test/Dockerfile new file mode 100644 index 00000000..e9a86b0d --- /dev/null +++ b/docker/test/Dockerfile @@ -0,0 +1,13 @@ +FROM python:3 + +WORKDIR /test + +COPY ./requirements.txt /test/requirements.txt +RUN pip install --no-cache-dir -r requirements.txt; rm -r /tmp +RUN pip install --no-cache-dir pytest; + +COPY ./test /test/test +COPY ./app /test/app + +CMD ["pytest"] + diff --git a/espncricinfo/__init__.py b/espncricinfo/__init__.py new file mode 100755 index 00000000..e69de29b diff --git a/espncricinfo/items.py b/espncricinfo/items.py new file mode 100755 index 00000000..07a8cb46 --- /dev/null +++ b/espncricinfo/items.py @@ -0,0 +1,37 @@ +# Define here the models for your scraped items +# +# See documentation in: +# https://docs.scrapy.org/en/latest/topics/items.html + +import scrapy + + +class PlayerItem(scrapy.Item): + + name = scrapy.Field() + image = scrapy.Field() + role = scrapy.Field() + player_id = scrapy.Field() + + +class ScoreItem(scrapy.Item): + + runs = scrapy.Field() + boundaries = scrapy.Field() + sixes = scrapy.Field() + wicket = scrapy.Field() + Maiden = scrapy.Field() + Catch = scrapy.Field() + Stump = scrapy.Field() + match_id = scrapy.Field() + + +class LiveMatchItem(scrapy.Item): + + team1 = scrapy.Field() + team2 = scrapy.Field() + match_id = scrapy.Field() + team1_squad = scrapy.Field() + team2_squad = scrapy.Field() + team1_id = scrapy.Field() + team2_id = scrapy.Field() diff --git a/crawler/settings.py b/espncricinfo/settings.py old mode 100644 new mode 100755 similarity index 61% rename from crawler/settings.py rename to espncricinfo/settings.py index 4a6493f8..467298b2 --- a/crawler/settings.py +++ b/espncricinfo/settings.py @@ -1,20 +1,4 @@ -""" - Copyright (C) 2020 Royston E Tauro & Sammith S Bharadwaj & Shreyas Raviprasad - - This program is free software: you can redistribute it and/or modify - it under the terms of the GNU Affero General Public License as published - by the Free Software Foundation, either version 3 of the License, or - (at your option) any later version. - - This program is distributed in the hope that it will be useful, - but WITHOUT ANY WARRANTY; without even the implied warranty of - MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the - GNU Affero General Public License for more details. - - You should have received a copy of the GNU Affero General Public License - along with this program. If not, see . -""" -# Scrapy settings for cricketcrawler project +# Scrapy settings for espncricinfo project # # For simplicity, this file contains only settings considered important or # commonly used. You can find more settings consulting the documentation: @@ -23,16 +7,18 @@ # https://docs.scrapy.org/en/latest/topics/downloader-middleware.html # https://docs.scrapy.org/en/latest/topics/spider-middleware.html -BOT_NAME = "crawler" +import os -SPIDER_MODULES = ["crawler.spiders"] -NEWSPIDER_MODULE = "crawler.spiders" +BOT_NAME = "espncricinfo" + +SPIDER_MODULES = ["espncricinfo.spiders"] +NEWSPIDER_MODULE = "espncricinfo.spiders" # Crawl responsibly by identifying yourself (and your website) on the user-agent -# USER_AGENT = 'cricketcrawler (+http://www.yourdomain.com)' +# USER_AGENT = 'espncricinfo (+http://www.yourdomain.com)' -# Obey robots.txt rules- +# Obey robots.txt rules ROBOTSTXT_OBEY = True # Configure maximum concurrent requests performed by Scrapy (default: 16) @@ -41,7 +27,7 @@ # Configure a delay for requests for the same website (default: 0) # See https://docs.scrapy.org/en/latest/topics/settings.html#download-delay # See also autothrottle settings and docs -DOWNLOAD_DELAY = 0.5 +# DOWNLOAD_DELAY = 3 # The download delay setting will honor only one of: # CONCURRENT_REQUESTS_PER_DOMAIN = 16 # CONCURRENT_REQUESTS_PER_IP = 16 @@ -60,14 +46,17 @@ # Enable or disable spider middlewares # See https://docs.scrapy.org/en/latest/topics/spider-middleware.html -# SPIDER_MIDDLEWARES = { -# 'cricketcrawler.middlewares.CricketcrawlerSpiderMiddleware': 543, -# } - # Enable or disable downloader middlewares +if os.getenv("TEST"): + SPIDER_MIDDLEWARES = { + 'scrapy_autounit.AutounitMiddleware': 950 + } + AUTOUNIT_ENABLED = True + + # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html # DOWNLOADER_MIDDLEWARES = { -# 'cricketcrawler.middlewares.CricketcrawlerDownloaderMiddleware': 543, +# 'espncricinfo.middlewares.EspncricinfoDownloaderMiddleware': 543, # } # Enable or disable extensions @@ -78,29 +67,27 @@ # Configure item pipelines # See https://docs.scrapy.org/en/latest/topics/item-pipeline.html -ITEM_PIPELINES = { - "crawler.pipelines.CricketcrawlerPipeline": 300, -} +# ITEM_PIPELINES = { +# 'espncricinfo.pipelines.EspncricinfoPipeline': 300, +# } # Enable and configure the AutoThrottle extension (disabled by default) # See https://docs.scrapy.org/en/latest/topics/autothrottle.html -AUTOTHROTTLE_ENABLED = True +# AUTOTHROTTLE_ENABLED = True # The initial download delay -AUTOTHROTTLE_START_DELAY = 1 +# AUTOTHROTTLE_START_DELAY = 5 # The maximum download delay to be set in case of high latencies -AUTOTHROTTLE_MAX_DELAY = 60 +# AUTOTHROTTLE_MAX_DELAY = 60 # The average number of requests Scrapy should be sending in parallel to -# each remote serverHTTP status code is not handled or not allowed -AUTOTHROTTLE_TARGET_CONCURRENCY = 1.0 +# each remote server +# AUTOTHROTTLE_TARGET_CONCURRENCY = 1.0 # Enable showing throttling stats for every response received: -AUTOTHROTTLE_DEBUG = True +# AUTOTHROTTLE_DEBUG = False # Enable and configure HTTP caching (disabled by default) # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html#httpcache-middleware-settings HTTPCACHE_ENABLED = True HTTPCACHE_EXPIRATION_SECS = 0 HTTPCACHE_DIR = "httpcache" -HTTPCACHE_IGNORE_HTTP_CODES = [500] +HTTPCACHE_IGNORE_HTTP_CODES = [] HTTPCACHE_STORAGE = "scrapy.extensions.httpcache.FilesystemCacheStorage" - -RETRY_HTTP_CODES = [502, 503, 504, 400, 408] diff --git a/espncricinfo/spiders/__init__.py b/espncricinfo/spiders/__init__.py new file mode 100755 index 00000000..ebd689ac --- /dev/null +++ b/espncricinfo/spiders/__init__.py @@ -0,0 +1,4 @@ +# This package will contain the spiders of your Scrapy project +# +# Please refer to the documentation for information on how to create and manage +# your spiders. diff --git a/espncricinfo/spiders/match-spider.py b/espncricinfo/spiders/match-spider.py new file mode 100755 index 00000000..39ba3e60 --- /dev/null +++ b/espncricinfo/spiders/match-spider.py @@ -0,0 +1,99 @@ +import scrapy +from espncricinfo.items import ScoreItem + + +class MatchesSpider(scrapy.Spider): + + name = "espn-matches" + allowed_domains = ["espncricinfo.com"] + + def start_requests(self): + return [ + scrapy.Request( + url="https://stats.espncricinfo.com/ci/engine/player/253802.html?class=1&orderby=start&orderbyad=reverse&template=results&type=allround&view=match", + callback=self.parse, + ) + ] + + def parse(self, response): + + matches = response.selector.xpath( + "//a[@href[contains(. , '/ci/engine/match')] and @title]" + )[:5] + pid = response.url.split(".html")[0].split("player/")[1] + score_dict = { + "runs": None, + "boundaries": None, + "sixes": None, + "wicket": None, + "Maiden": None, + "Catch": None, + "Stump": None, + } + keeping_stats = response.selector.xpath( + "//table[caption[contains(.,'Match by match list')]]//tr[td]" + )[:5] + for i, match in enumerate(matches): + score_dict["Catch"] = score_dict["Stump"] = 0 + if "Test" in match.xpath("text()").get(): + score_dict["Catch"] += int( + keeping_stats[i].xpath("td[6]/text()").get().strip() + ) + score_dict["Catch"] += int( + keeping_stats[i].xpath("td[7]/text()").get().strip() + ) + elif ( + "ODI" in match.xpath("text()").get() + or "T20" in match.xpath("text()").get() + ): + score_dict["Catch"] += int( + keeping_stats[i].xpath("td[4]/text()").get().strip() + ) + score_dict["Catch"] += int( + keeping_stats[i].xpath("td[5]/text()").get().strip() + ) + yield scrapy.Request( + url="https://www.espncricinfo.com" + match.xpath("@href").get(), + callback=self.parse_match, + cb_kwargs={ + "pid": pid, + "score_dict": score_dict, + "match_id": match.xpath("text()").get(), + }, + ) + + def parse_match(self, response, pid, score_dict, match_id): + + batsman = response.selector.xpath( + "//table[@class='table batsman']//tr[td[a[@href[contains(., '" + + pid + + "')]]]]" + ) + if batsman: + score_dict["runs"] = score_dict["boundaries"] = score_dict["sixes"] = 0 + for bat in batsman: + score_dict["runs"] += int(bat.xpath("td[3]/text()").get().strip()) + score_dict["boundaries"] += int(bat.xpath("td[6]/text()").get().strip()) + score_dict["sixes"] += int(bat.xpath("td[7]/text()").get().strip()) + + bowler = response.selector.xpath( + "//table[@class='table bowler']//tr[td[a[@href[contains(., '" + + pid + + "')]]]]" + ) + if bowler: + score_dict["wicket"] = score_dict["Maiden"] = 0 + for bowl in bowler: + score_dict["wicket"] += int(bowl.xpath("td[3]/text()").get().strip()) + score_dict["Maiden"] += int(bowl.xpath("td[5]/text()").get().strip()) + + yield ScoreItem( + runs=score_dict["runs"], + boundaries=score_dict["boundaries"], + sixes=score_dict["sixes"], + wicket=score_dict["wicket"], + Maiden=score_dict["Maiden"], + Catch=score_dict["Catch"], + Stump=score_dict["Stump"], + match_id=match_id, + ) diff --git a/espncricinfo/spiders/player-spider.py b/espncricinfo/spiders/player-spider.py new file mode 100755 index 00000000..e4078800 --- /dev/null +++ b/espncricinfo/spiders/player-spider.py @@ -0,0 +1,32 @@ +import scrapy +from espncricinfo.items import PlayerItem + + +class PlayerListSpider(scrapy.Spider): + + name = "espn-players" + allowed_domains = ["espncricinfo.com"] + + def start_requests(self): + return [ + scrapy.Request( + url="https://www.espncricinfo.com/ci/content/player/253802.html", + callback=self.parse, + ) + ] + + def parse(self, response): + + name = response.selector.xpath("//div[@class='ciPlayernametxt']/div/h1/text()") + role = response.selector.xpath( + "//p[@class='ciPlayerinformationtxt' and b/text()[contains(.,'Playing role')]]/span/text()" + ) + image = response.selector.xpath( + "//img[@src[contains(.,'espncricinfo.com/inline/content')]]" + ).xpath("@src") + + yield PlayerItem( + name=name.get(), + role=role.get(), + image=image.get(), + ) diff --git a/espncricinfo/spiders/upcoming-spider.py b/espncricinfo/spiders/upcoming-spider.py new file mode 100755 index 00000000..304ceec5 --- /dev/null +++ b/espncricinfo/spiders/upcoming-spider.py @@ -0,0 +1,86 @@ +import scrapy +import datetime +import json +from espncricinfo.items import LiveMatchItem + + +class LiveSpider(scrapy.Spider): + + name = "espn-live" + allowed_domains = ["espncricinfo.com"] + + def start_requests(self): + return [ + scrapy.Request( + url="https://www.espncricinfo.com/live-cricket-match-schedule-fixtures", + callback=self.parse, + ) + ] + + def parse(self, response): + + matches = response.selector.xpath("//a[@class = 'match-info-link-FIXTURES']") + now = datetime.datetime.now().date() + + for match in matches: + + try: + if ( + datetime.datetime.strptime( + match.xpath("div/div/div/span/text()").get().split(",")[0], + "%d-%b-%Y", + ).date() + - now + ).days <= 7: + match_link = [ + match.xpath("@href").get() + for team_div in match.xpath( + "div/div/div[@class='teams']/div[@class='team']" + ) + if team_div.xpath("div/p/text()").get() + in [ + "India", + "Australia", + "England", + "Bangladesh", + "New Zealand", + "South Africa", + "Pakistan", + "Sri Lanka", + "West Indies", + "Afghanistan", + ] + ] + if match_link: + yield scrapy.Request( + url="https://www.espncricinfo.com/matches/engine/match/" + + match_link[0] + .split("/live-cricket-score")[0] + .split("-")[-1] + + ".json", + callback=self.parse_match, + ) + except ValueError: + pass + + def parse_match(self, response): + + match_data = json.loads(response.text) + team1_squad = [] + team2_squad = [] + for squad in match_data["team"][0]["squad"]: + team1_squad.append( + {"name": squad["card_long"], "player_id": squad["object_id"]} + ) + for squad in match_data["team"][1]["squad"]: + team2_squad.append({"name": squad["card_long"], "id": squad["object_id"]}) + + yield LiveMatchItem( + team1=match_data["match"]["team1_name"], + team2=match_data["match"]["team2_name"], + match_id=match_data["match"]["international_class_id"], + team1_squad=team1_squad, + team2_squad=team2_squad, + team1_id=match_data["match"]["team1_id"], + team2_id=match_data["match"]["team2_id"], + ) diff --git a/requirements.txt b/requirements.txt old mode 100644 new mode 100755 index 5a3d3ab1..50eea6c6 --- a/requirements.txt +++ b/requirements.txt @@ -1,4 +1,4 @@ sklearn==0.0 fastapi[all]==0.63.0 -pycricbuzz==2.4 scrapy==2.4 +scrapyrt==0.11.0 \ No newline at end of file diff --git a/scrapy.cfg b/scrapy.cfg old mode 100644 new mode 100755 index 83a4eef6..a5cd4ae5 --- a/scrapy.cfg +++ b/scrapy.cfg @@ -4,8 +4,9 @@ # https://scrapyd.readthedocs.io/en/latest/deploy.html [settings] -default = crawler.settings +default = espncricinfo.settings [deploy] #url = http://localhost:6800/ -project = crawler +project = espncricinfo + diff --git a/test/__init__.py b/test/__init__.py index 9102b2dc..e69de29b 100644 --- a/test/__init__.py +++ b/test/__init__.py @@ -1,7 +0,0 @@ -""" -Setting paths for testing -""" - -import sys - -sys.path.insert(1, "..") diff --git a/test/test_main.py b/test/test_main.py index 22ffacb3..970e1975 100644 --- a/test/test_main.py +++ b/test/test_main.py @@ -4,7 +4,7 @@ import os from fastapi.testclient import TestClient from app.main import app -from app.fantasy_cricket.utils import Matches +from app.fantasy_cricket.matches import Matches client = TestClient(app) cricket = Matches() @@ -16,21 +16,13 @@ def test_home(): assert response.status_code == 200 -def test_home_post(): - teams = [ - [match[0]["name"], match[1]["name"]] - for match in cricket.get_match() - ] - for team in teams: - response = client.post("/", data={"match": team[0]+" vs "+team[1]}) - assert response.status_code == 302 - def test_playing_11(): - teams = [ - [match[0]["name"], match[1]["name"]] - for match in cricket.get_match() - ] - for team in teams: - response = client.get("/playing11?team1="+team[0]+"&team2="+team[1], - data={"match": team[0]+" vs "+team[1]}) + + matches = cricket.get_upcoming_match() + for teams in matches: + response = client.get("/playing11?team1="+ teams["team1"] + "&team2=" + teams["team2"]) assert response.status_code == 200 + +def test_results(): + response = client.get("/results?match_type=1&team=India&team=England&player_team1=253802&player_team1=277916&player_team1=398438&player_team1=26421&player_team1=625383&player_team1=940973&player_team1=625371&player_team1=931581&player_team1=32540&player_team1=422108&player_team1=34102&player_team2=303669&player_team2=8917&player_team2=8608&player_team2=669855&player_team2=646847&player_team2=10617&player_team2=398778&player_team2=308967&player_team2=364788&player_team2=641423&player_team2=455524") + assert response.status_code == 200