12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970 |
- """API module"""
- import re
- from datetime import datetime, date, timedelta
- import requests
- from bs4 import BeautifulSoup
- from app import BASE_URL, HEADERS
- TYPES = {
- 'yellow': 1,
- 'oil': 2,
- 'ore': 5,
- 'uranium': 11,
- 'diamond': 15,
- }
- def get_factories(region_id):
- """Get factories from state"""
- # return read_factories()
- return download_factories(region_id)
- def read_factories():
- """Read factories file"""
- with open('factories_4001.html') as file:
- factories, more = parse_factories(file, 4001)
- return factories
- def download_factories(region_id):
- """Download the factories"""
- factories = []
- more = True
- page = 0
- while more:
- response = requests.get(
- '{}factory/search/{}/0/0/{}'.format(BASE_URL, region_id, page*25),
- headers=HEADERS
- )
- tmp_factories, more = parse_factories(response.text, region_id)
- factories = factories + tmp_factories
- page += 1
- return factories
- def parse_factories(html, region_id):
- """Parse html return factories"""
- soup = BeautifulSoup(html, 'html.parser')
- factories_tree = soup.find_all(class_='list_link')
- factories = []
- for factory_tree in factories_tree:
- columns = factory_tree.find_all('td')
- factories.append({
- 'region_id': region_id,
- 'id': int(factory_tree['user']),
- 'name': columns[1].contents[0].strip(),
- 'level': int(columns[2].string),
- 'workers': int(re.sub(r'\/[0-9]*$', '', columns[3].string)),
- 'wage': int(columns[4].string.replace('%', '')),
- 'experience': int(columns[5].string),
- })
- return factories, bool(len(factories_tree) >= 25)
- def parse_date(date_string):
- """Parse date to object"""
- if 'Today' in date_string:
- return date.today()
- if 'Yesterday' in date_string:
- return date.today() - timedelta(1)
- return datetime.strptime(date_string, '%d %B %Y').date()
|