Skip to content
This repository was archived by the owner on Jul 18, 2022. It is now read-only.

Commit 54b97e2

Browse files
author
Michael Oliver
committedApr 11, 2020
Added shop listing logic + startup event, tests, added update user roles/shops endpoint + me versions
1 parent 008ccd5 commit 54b97e2

18 files changed

+670
-79
lines changed
 

‎docker-compose.yml

+5
Original file line numberDiff line numberDiff line change
@@ -52,3 +52,8 @@ services:
5252
image: mailhog/mailhog:v1.0.0
5353
ports:
5454
- "8025:8025"
55+
56+
splash-browser:
57+
image: scrapinghub/splash
58+
ports:
59+
- "8050:8050"
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,27 @@
1+
"""Adding user shops relationship
2+
3+
Revision ID: daff23253894
4+
Revises: fab2a86c8b63
5+
Create Date: 2020-04-11 08:46:05.071956
6+
7+
"""
8+
import sqlalchemy as sa
9+
from alembic import op
10+
11+
# revision identifiers, used by Alembic.
12+
revision = "daff23253894"
13+
down_revision = "fab2a86c8b63"
14+
branch_labels = None
15+
depends_on = None
16+
17+
18+
def upgrade():
19+
# ### commands auto generated by Alembic - please adjust! ###
20+
pass
21+
# ### end Alembic commands ###
22+
23+
24+
def downgrade():
25+
# ### commands auto generated by Alembic - please adjust! ###
26+
pass
27+
# ### end Alembic commands ###
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,66 @@
1+
"""Adding user shops
2+
3+
Revision ID: fab2a86c8b63
4+
Revises: e7ff97c10b8f
5+
Create Date: 2020-04-11 08:44:40.315632
6+
7+
"""
8+
import sqlalchemy as sa
9+
from alembic import op
10+
11+
# revision identifiers, used by Alembic.
12+
revision = "fab2a86c8b63"
13+
down_revision = "e7ff97c10b8f"
14+
branch_labels = None
15+
depends_on = None
16+
17+
18+
def upgrade():
19+
# ### commands auto generated by Alembic - please adjust! ###
20+
op.create_table(
21+
"shop",
22+
sa.Column("id", sa.Integer(), nullable=False),
23+
sa.Column(
24+
"created_at",
25+
sa.TIMESTAMP(timezone=True),
26+
server_default=sa.text("now()"),
27+
nullable=True,
28+
),
29+
sa.Column("updated_at", sa.TIMESTAMP(timezone=True), nullable=True),
30+
sa.Column("name", sa.String(), nullable=False),
31+
sa.Column("url", sa.String(), nullable=False),
32+
sa.Column("query_url", sa.String(), nullable=False),
33+
sa.Column("render_javascript", sa.Boolean(), nullable=False),
34+
sa.Column("listing_page_selector", sa.JSON(), nullable=True),
35+
sa.PrimaryKeyConstraint("id"),
36+
sa.UniqueConstraint("name"),
37+
sa.UniqueConstraint("url"),
38+
)
39+
op.create_table(
40+
"user_shops",
41+
sa.Column("id", sa.Integer(), nullable=False),
42+
sa.Column(
43+
"created_at",
44+
sa.TIMESTAMP(timezone=True),
45+
server_default=sa.text("now()"),
46+
nullable=True,
47+
),
48+
sa.Column("updated_at", sa.TIMESTAMP(timezone=True), nullable=True),
49+
sa.Column("user_id", sa.Integer(), nullable=True),
50+
sa.Column("shop_id", sa.Integer(), nullable=True),
51+
sa.ForeignKeyConstraint(
52+
["shop_id"], ["shop.id"], onupdate="CASCADE", ondelete="CASCADE"
53+
),
54+
sa.ForeignKeyConstraint(
55+
["user_id"], ["user.id"], onupdate="CASCADE", ondelete="CASCADE"
56+
),
57+
sa.PrimaryKeyConstraint("id"),
58+
)
59+
# ### end Alembic commands ###
60+
61+
62+
def downgrade():
63+
# ### commands auto generated by Alembic - please adjust! ###
64+
op.drop_table("user_shops")
65+
op.drop_table("shop")
66+
# ### end Alembic commands ###

‎server/app/api/v1/dependencies/or_404.py

+18-2
Original file line numberDiff line numberDiff line change
@@ -2,8 +2,8 @@
22
from sqlalchemy import orm
33

44
from app.db.session import get_db
5-
from app.models import rolemodels, usermodels
6-
from app.service import roleservice, userservice
5+
from app.models import rolemodels, shopmodels, usermodels
6+
from app.service import roleservice, shopservice, userservice
77

88

99
def get_role_by_id_or_404(
@@ -51,3 +51,19 @@ def get_user_or_404(
5151
detail="Specified user was not found.",
5252
)
5353
return user
54+
55+
56+
def get_shop_or_404(
57+
db_session: orm.Session = Depends(get_db),
58+
shop_id: int = Path(..., alias="id", ge=1),
59+
) -> shopmodels.Shop:
60+
"""
61+
Route dependency that retrieves a shop by id or raises 404.
62+
"""
63+
shop = shopservice.get(db_session=db_session, id_=shop_id)
64+
if not shop:
65+
raise HTTPException(
66+
status_code=status.HTTP_404_NOT_FOUND,
67+
detail="Specified shop was not found.",
68+
)
69+
return shop

‎server/app/api/v1/routes/me.py

+41-3
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,11 @@
11
from typing import List
22

3-
from fastapi import APIRouter, Depends, HTTPException, Path, status
3+
from fastapi import APIRouter, Body, Depends, HTTPException, Path, status
44
from sqlalchemy.orm import Session
55

66
from app.db.session import get_db
7-
from app.models import rolemodels, usermodels
8-
from app.service import userservice
7+
from app.models import rolemodels, shopmodels, usermodels
8+
from app.service import shopservice, userservice
99

1010
from ..dependencies.auth import get_current_active_user
1111

@@ -44,3 +44,41 @@ def read_current_user_roles(
4444
):
4545
"""Read the currently logged in user roles"""
4646
return current_user.roles
47+
48+
49+
@router.get(
50+
"/me/shops", response_model=List[shopmodels.ShopRead],
51+
)
52+
def read_current_user_shops(
53+
current_user: usermodels.User = Depends(get_current_active_user),
54+
):
55+
"""
56+
Retrieve a list of shops assigned to the currently logged in user.
57+
"""
58+
return current_user.shops
59+
60+
61+
@router.put(
62+
"/me/shops", response_model=List[shopmodels.ShopRead],
63+
)
64+
def update_user_shops(
65+
*,
66+
db_session: Session = Depends(get_db),
67+
current_user: usermodels.User = Depends(get_current_active_user),
68+
shops_ids: List[int] = Body(...),
69+
):
70+
"""
71+
Update the assigned shops of the currently logged in user.
72+
"""
73+
74+
shop_objs = shopservice.get_multiple_by_ids(db_session=db_session, ids_=shops_ids)
75+
76+
if len(shop_objs) != len(shops_ids):
77+
raise HTTPException(
78+
status_code=status.HTTP_404_NOT_FOUND,
79+
detail="One of the specified shops was not found man.",
80+
)
81+
82+
current_user.shops = shop_objs
83+
db_session.commit()
84+
return shop_objs

‎server/app/api/v1/routes/shops.py

+106
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,106 @@
1+
from typing import List, Set
2+
3+
from fastapi import APIRouter, Depends, HTTPException, Query, status
4+
from sqlalchemy import orm
5+
6+
from app.db.session import get_db
7+
from app.models import shopmodels
8+
from app.service import scraperservice, shopservice
9+
10+
from ..dependencies.auth import admin_role, user_role
11+
from ..dependencies.or_404 import get_shop_or_404
12+
13+
router = APIRouter()
14+
15+
16+
# Populate the scrapers into memory
17+
@router.on_event("startup")
18+
def populate_scrapers():
19+
from tests.common import SessionLocal
20+
21+
scraperservice.populate_scrapers(db_session=SessionLocal())
22+
23+
24+
@router.get(
25+
"/", response_model=List[shopmodels.ShopRead], dependencies=[Depends(user_role)]
26+
)
27+
def get_shops(*, db_session: orm.Session = Depends(get_db)):
28+
"""
29+
Retrieve a list of shops.
30+
"""
31+
return shopservice.get_multiple(db_session=db_session)
32+
33+
34+
@router.get("/{id}", response_model=shopmodels.ShopRead)
35+
def get_single_shop(shop: shopmodels.ShopRead = Depends(get_shop_or_404),):
36+
"""
37+
Retrieve details about a specific shop.
38+
"""
39+
return shop
40+
41+
42+
@router.post(
43+
"/",
44+
status_code=status.HTTP_201_CREATED,
45+
response_model=shopmodels.ShopRead,
46+
dependencies=[Depends(admin_role)],
47+
)
48+
def create_shop(
49+
*, db_session: orm.Session = Depends(get_db), shop_in: shopmodels.ShopCreate
50+
):
51+
"""
52+
Create a new shop.
53+
"""
54+
55+
if shopservice.get_by_name(db_session=db_session, name=shop_in.name):
56+
raise HTTPException(
57+
status_code=status.HTTP_400_BAD_REQUEST,
58+
detail="Shop with that name already exists",
59+
)
60+
return shopservice.create(db_session=db_session, shop_in=shop_in)
61+
62+
63+
@router.put(
64+
"/{id}", response_model=shopmodels.ShopRead, dependencies=[Depends(admin_role)]
65+
)
66+
def update_shop(
67+
*,
68+
db_session: orm.Session = Depends(get_db),
69+
shop_in: shopmodels.ShopUpdate,
70+
shop: shopmodels.Shop = Depends(get_shop_or_404),
71+
):
72+
"""
73+
Update an individual shop.
74+
"""
75+
76+
return shopservice.update(db_session=db_session, shop=shop, shop_in=shop_in)
77+
78+
79+
@router.delete(
80+
"/{id}", response_model=shopmodels.ShopRead, dependencies=[Depends(admin_role)]
81+
)
82+
def delete_shop(
83+
*,
84+
db_session: orm.Session = Depends(get_db),
85+
shop: shopmodels.Shop = Depends(get_shop_or_404),
86+
):
87+
"""
88+
Delete an individual shop.
89+
"""
90+
91+
return shopservice.delete(db_session=db_session, id_=shop.id)
92+
93+
94+
@router.get("/listings/", dependencies=[Depends(admin_role)])
95+
async def read_multiple_shops_listings(
96+
query: str = Query(..., description="The search term to query by."),
97+
limit: int = Query(10, description="The number of results to return.", ge=1, le=40),
98+
include: Set[int] = Query(..., description="Shop IDs to query for listings."),
99+
):
100+
"""
101+
Scrape multiple shops for listings in real time.
102+
"""
103+
104+
return await scraperservice.query_scrapers(
105+
query=query, limit=limit, include=include
106+
)

‎server/app/api/v1/routes/users.py

+37-3
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@
44
from sqlalchemy.orm import Session
55

66
from app.db.session import get_db
7-
from app.models import rolemodels, usermodels
8-
from app.service import roleservice, userservice
7+
from app.models import rolemodels, shopmodels, usermodels
8+
from app.service import roleservice, shopservice, userservice
99

1010
from ..dependencies.or_404 import get_user_or_404
1111

@@ -110,5 +110,39 @@ def update_user_roles(
110110
detail="One of the specified roles was not found man. I don't know which one yet.",
111111
)
112112

113-
user.roles = [role_objs]
113+
user.roles = role_objs
114+
db_session.commit()
115+
116+
117+
@router.get(
118+
"/{id}/shops", response_model=List[shopmodels.ShopRead],
119+
)
120+
def read_user_shops(user: usermodels.User = Depends(get_user_or_404),):
121+
"""
122+
Retrieve a list of shops assigned to an individual user.
123+
"""
124+
return user.shops
125+
126+
127+
@router.put(
128+
"/{id}/shops", response_model=List[shopmodels.ShopRead],
129+
)
130+
def update_user_shops(
131+
*,
132+
db_session: Session = Depends(get_db),
133+
user: usermodels.User = Depends(get_user_or_404),
134+
shops_ids: List[int] = Body(...),
135+
):
136+
"""
137+
Update the assigned shops of an individual user.
138+
"""
139+
140+
shop_objs = shopservice.get_multiple_by_ids(db_session=db_session, ids_=shops_ids)
141+
if len(shops_ids) != len(shops_ids):
142+
raise HTTPException(
143+
status_code=status.HTTP_404_NOT_FOUND,
144+
detail="One of the specified shops was not found man.",
145+
)
146+
147+
user.roles = [shop_objs]
114148
db_session.commit()

‎server/app/api/v1/v1_router.py

+7-1
Original file line numberDiff line numberDiff line change
@@ -1,20 +1,26 @@
11
from fastapi import APIRouter, Depends
22

33
from .dependencies.auth import admin_role
4-
from .routes import auth, me, roles, users
4+
from .routes import auth, me, roles, shops, users
55

66
router = APIRouter()
7+
78
router.include_router(router=auth.router, prefix="/auth", tags=["auth"])
9+
810
router.include_router(router=me.router, tags=["self"])
11+
912
router.include_router(
1013
router=users.router,
1114
prefix="/users",
1215
tags=["users"],
1316
dependencies=[Depends(admin_role)],
1417
)
18+
1519
router.include_router(
1620
router=roles.router,
1721
prefix="/roles",
1822
tags=["roles"],
1923
dependencies=[Depends(admin_role)],
2024
)
25+
26+
router.include_router(router=shops.router, prefix="/shops", tags=["shops"])

‎server/app/db/initdb.py

+9-2
Original file line numberDiff line numberDiff line change
@@ -3,8 +3,8 @@
33
import yaml
44
from sqlalchemy import engine, orm
55

6-
from app.models import rolemodels, usermodels
7-
from app.service import roleservice, userservice
6+
from app.models import rolemodels, shopmodels, usermodels
7+
from app.service import roleservice, shopservice, userservice
88
from app.settings import settings
99

1010
INITDB_PATH = settings.APP_DIR / "db" / "initdb.yaml"
@@ -14,6 +14,7 @@
1414

1515
def initdb(db_session: orm.Session):
1616
init_roles(db_session=db_session)
17+
init_shops(db_session=db_session)
1718

1819

1920
def init_roles(db_session: orm.Session):
@@ -24,6 +25,12 @@ def init_roles(db_session: orm.Session):
2425
roleservice.create_multiple(db_session=db_session, roles_in=roles_in)
2526

2627

28+
def init_shops(db_session: orm.Session):
29+
for shop in config["shops"]:
30+
shop_in = shopmodels.ShopCreate(**shop)
31+
shopservice.create(db_session=db_session, shop_in=shop_in)
32+
33+
2734
def setup_guids_postgresql(engine: engine.Engine) -> None: # pragma: no cover
2835
"""
2936
Set up UUID generation using the pgcrypto extension for postgres

‎server/app/db/initdb.yaml

+193
Original file line numberDiff line numberDiff line change
@@ -3,3 +3,196 @@ roles:
33
description: Permits administrator privileges.
44
- name: user
55
description: Normal user privileges.
6+
7+
shops:
8+
9+
- url: www.aldi.co.uk
10+
name: aldi
11+
query_url: /search?category=ALL&text={query}
12+
render_javascript: false
13+
listing_page_selector:
14+
items:
15+
css: 'div.hover-item:nth-of-type(n+6)'
16+
multiple: true
17+
type: Text
18+
children:
19+
url:
20+
css: a.category-item__wrapper-link
21+
type: Link
22+
name:
23+
css: 'ul.category-item__meta li.category-item__title'
24+
type: Text
25+
price:
26+
css: 'ul.category-item__meta.list-unstyled > a > li'
27+
type: Text
28+
price_per_unit:
29+
css: a.category-item__wrapper-link
30+
type: Attribute
31+
attribute: category-item__pricePerUnit
32+
image_url:
33+
css: 'a.category-item__link picture.category-item__image source:first-of-type'
34+
type: Attribute
35+
attribute: srcset
36+
37+
- url: www.amazon.co.uk
38+
name: amazon_pantry
39+
query_url: /s?k={query}&i=pantry
40+
render_javascript: false
41+
listing_page_selector:
42+
items:
43+
css: '#search div.s-result-item'
44+
multiple: true
45+
type: Text
46+
children:
47+
price:
48+
css: span.a-offscreen
49+
type: Text
50+
name:
51+
css: h2
52+
type: Text
53+
url:
54+
css: a
55+
type: Link
56+
image_url:
57+
css: img.s-image
58+
type: Attribute
59+
attribute: src
60+
price_per_unit:
61+
css: span.a-size-base.a-color-secondary
62+
type: Text
63+
64+
- url: groceries.asda.com
65+
name: asda
66+
query_url: /search/{query}
67+
render_javascript: true
68+
listing_page_selector:
69+
items:
70+
css: 'section.products-tab li.co-item'
71+
multiple: true
72+
type: Text
73+
children:
74+
price:
75+
css: strong.co-product__price
76+
type: Text
77+
price_per_unit:
78+
css: span.co-product__price-per-uom
79+
type: Text
80+
name:
81+
css: a.co-product__anchor
82+
type: Text
83+
url:
84+
css: a.co-product__anchor
85+
type: Link
86+
image_url:
87+
css: img.co-product__image
88+
type: Attribute
89+
attribute: src
90+
91+
- url: www.iceland.co.uk
92+
name: iceland
93+
query_url: /search?q={query}
94+
render_javascript: false
95+
listing_page_selector:
96+
items:
97+
css: 'ul.search-result-items div.product-tile'
98+
multiple: true
99+
type: Text
100+
children:
101+
name:
102+
css: 'a.name-link span'
103+
type: Text
104+
price:
105+
css: 'span.product-sales-price span'
106+
type: Text
107+
price_per_unit:
108+
css: div.product-pricing-info
109+
type: Text
110+
image_url:
111+
css: img.thumb-link
112+
type: Attribute
113+
attribute: src
114+
url:
115+
css: 'div.product-image a.thumb-link'
116+
type: Attribute
117+
attribute: href
118+
119+
- url: groceries.morrisons.com
120+
name: morrisons
121+
query_url: /search?entry={query}
122+
render_javascript: false
123+
listing_page_selector:
124+
items:
125+
css: 'ul.fops.fops-regular li.fops-item:nth-of-type(n+1)'
126+
multiple: true
127+
type: Text
128+
children:
129+
price:
130+
css: span.fop-price
131+
type: Text
132+
name:
133+
css: h4.fop-title
134+
type: Text
135+
price_per_unit:
136+
css: span.fop-unit-price
137+
type: Text
138+
image_url:
139+
css: img.fop-img
140+
type: Attribute
141+
attribute: src
142+
url:
143+
css: div.fop-contentWrapper
144+
type: Link
145+
146+
- url: www.sainsburys.co.uk
147+
name: sainsburys
148+
query_url: /webapp/wcs/stores/servlet/SearchDisplayView?storeId=10151&orderBy=RELEVANCE&searchTerm={query}
149+
render_javascript: false
150+
listing_page_selector:
151+
items:
152+
css: 'div.section li.gridItem'
153+
multiple: true
154+
type: Text
155+
children:
156+
url:
157+
css: 'h3 a'
158+
type: Link
159+
name:
160+
css: h3
161+
type: Text
162+
price:
163+
css: p.pricePerUnit
164+
type: Text
165+
price_per_unit:
166+
css: p.pricePerMeasure
167+
type: Text
168+
image_url:
169+
css: 'h3 img'
170+
type: Attribute
171+
attribute: src
172+
173+
- url: www.tesco.com
174+
name: tesco
175+
query_url: /groceries/en-GB/search?query={query}
176+
render_javascript: false
177+
listing_page_selector:
178+
items:
179+
css: li.product-list--list-item
180+
multiple: true
181+
type: Text
182+
children:
183+
url:
184+
css: a.sc-kAzzGY
185+
type: Link
186+
name:
187+
css: div.product-details--content
188+
type: Text
189+
price:
190+
css: 'div.price-per-sellable-unit div'
191+
type: Text
192+
price_per_unit:
193+
css: div.price-per-quantity-weight
194+
type: Text
195+
image_url:
196+
css: img.product-image
197+
type: Attribute
198+
attribute: src

‎server/app/models/__init__.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -3,5 +3,5 @@
33
"""
44

55
from .rolemodels import *
6-
from .usermodels import *
76
from .shopmodels import *
7+
from .usermodels import *

‎server/app/models/shopmodels.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,7 @@ class ShopCreate(PydanticBase):
4242
class ShopRead(PydanticTS, ShopCreate):
4343
"""Attributes to return via API"""
4444

45-
pass
45+
id: int
4646

4747

4848
class ShopUpdate(PydanticBase):

‎server/app/models/usermodels.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ class User(SQLAlchemyTS, SQLAlchemyIntPK, SQLAlchemyBase):
2323

2424
# Relationships
2525
roles = relationship("Role", secondary="user_roles")
26-
# shops = relationship("Shop", secondary="user_shops")
26+
shops = relationship("Shop", secondary="user_shops")
2727

2828
@property
2929
def role_names(self) -> List[str]:

‎server/app/service/scraperservice.py

+21-64
Original file line numberDiff line numberDiff line change
@@ -3,53 +3,49 @@
33
from typing import Set
44

55
import httpx
6-
import pyppeteer
76
import selectorlib
8-
from app.core.settings import settings
9-
from app.crud import shop_crud
10-
from app.schemas.shop import ShopConfigurationDB
7+
from sqlalchemy import orm
8+
9+
from app.models import shopmodels
10+
from app.service import shopservice
11+
from app.settings import settings
1112

1213
logger = logging.getLogger(__name__)
1314

1415

1516
class Scraper:
16-
def __init__(self, config: ShopConfigurationDB) -> None:
17+
def __init__(self, shop: shopmodels.ShopRead) -> None:
1718
self.protocol = "https"
18-
self._config = config
19-
self.base_url = f"{self.protocol}://{self._config.url}"
20-
self.name = self._config.name
19+
self._shop = shop
20+
self.base_url = f"{self.protocol}://{self._shop.url}"
21+
self.name = self._shop.name
2122

2223
# Create Extractor for listing page
2324
self._listing_page_extractor = selectorlib.Extractor(
24-
self._config.listing_page_selector
25+
self._shop.listing_page_selector
2526
)
2627

2728
def __repr__(self) -> str:
2829
return f"Scraper(name={self.name}, base_url={self.base_url})"
2930

3031
def _build_query_url(self, q: str) -> str:
31-
return self.base_url + self._config.query_url.format(query=q)
32+
return self.base_url + self._shop.query_url.format(query=q)
3233

3334
async def query_listings(
3435
self, client: httpx.AsyncClient, query: str, limit: int = 10
3536
) -> dict:
3637

3738
url = self._build_query_url(query)
38-
39-
# Render page with `pyppeteer` if needed
40-
if self._config.render_javascript:
41-
html = await render_page(url=url)
42-
else:
43-
html = await fetch_page(url=url, client=client)
39+
html = await fetch_page(url=url, client=client)
4440

4541
results = self._listing_page_extractor.extract(
4642
html, base_url=self.base_url
4743
).get("items")
4844
if results:
4945
results = results[:limit]
5046
response_object = {
51-
"id": self._config.id,
52-
"name": self._config.name,
47+
"id": self._shop.id,
48+
"name": self._shop.name,
5349
"listings": results,
5450
}
5551
return response_object
@@ -62,32 +58,11 @@ async def fetch_page(url: str, client: httpx.AsyncClient):
6258
return html
6359

6460

65-
async def render_page(url: str) -> str:
66-
"""
67-
Using ``pyppeteer`` load a web page and return HTML content.
68-
"""
69-
options = {
70-
"timeout": int(settings.scraper.PYPPETEER_TIMEOUT * 1000),
71-
"waitUntil": "domcontentloaded",
72-
}
73-
browser = await pyppeteer.launch(
74-
executablePath=settings.CHROME_BIN, ignoreHTTPSErrors=True, headless=True
75-
)
76-
page = await browser.newPage()
77-
await page.goto(url, options=options)
78-
await asyncio.sleep(settings.scraper.PYPPETEER_SLEEP)
79-
html = await page.content()
80-
await browser.close()
81-
return html
82-
83-
8461
async def query_scrapers(query: str, limit: int, include: Set[int]):
8562
"""Query scrapers entry point."""
8663

8764
# Only use one client for all requests
88-
async with httpx.AsyncClient(
89-
verify=False, timeout=settings.scraper.HTTPCLIENT_TIMEOUT
90-
) as client:
65+
async with httpx.AsyncClient(verify=False,) as client:
9166
tasks = [
9267
scrapers[i].query_listings(client=client, query=query, limit=limit)
9368
for i in include
@@ -99,31 +74,13 @@ async def query_scrapers(query: str, limit: int, include: Set[int]):
9974
scrapers = {}
10075

10176

102-
async def initialise():
77+
def populate_scrapers(db_session: orm.Session):
10378
"""
104-
Reads all shop configurations from database and using each config initialise's a `Scraper` instance.
105-
Local scraper dict is then used for quick lookup. Key is scraper id and value is `Scraper` instance.
106-
Should be called every time new configurations are added to db.
79+
Populate scraper configuration into memory for fast lookup.
10780
"""
10881
global scrapers
10982
scrapers = {}
110-
shops = await shop_crud.read_all()
111-
for s in shops:
112-
scrapers[s["id"]] = Scraper(config=ShopConfigurationDB(**s))
113-
114-
115-
# async def initialise():
116-
# global scrapers
117-
# """Reads scraper information from /etc and populates the database with shop configs."""
118-
#
119-
# with open(settings.SHOPS_YAML_PATH) as fileobj:
120-
# shopsconfig = yaml.safe_load_all(fileobj.read())
121-
#
122-
# global scrapers
123-
# for config in shopsconfig:
124-
# shop = await shop_crud.read_by_name(config["name"])
125-
# if not shop:
126-
# logger.info(f"Shop not found adding: {config['name']}")
127-
# shop = await shop_crud.create(ShopConfigurationSchema(**config))
128-
#
129-
# scrapers[shop["id"]] = Scraper(config=ShopConfigurationDB(**shop))
83+
shops = shopservice.get_multiple(db_session=db_session)
84+
for shop in shops:
85+
shop_model = shopmodels.ShopRead.from_orm(shop)
86+
scrapers[shop.id] = Scraper(shop_model)

‎server/manage.py

+3-1
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
import typer
66
from tabulate import tabulate
77

8-
from app.db.initdb import initdb
8+
from app.db.initdb import init_shops
99
from app.enums import logenums, userenums
1010
from app.main import app
1111
from app.models import rolemodels, usermodels
@@ -311,6 +311,8 @@ def seeddb():
311311
role=admin_role,
312312
)
313313

314+
init_shops(db_session=db_session)
315+
314316
typer.echo(Messages.success)
315317

316318

‎server/tests/api/v1/test_me.py

+12
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
import pytest
22
from fastapi.testclient import TestClient
33

4+
from tests import factories
5+
46

57
def test_read_me(user_role_client: TestClient):
68
url = "/api/v1/me"
@@ -53,3 +55,13 @@ def test_read_me_roles(user_role_client: TestClient):
5355

5456
roles = resp.json()
5557
assert roles[0]["name"] == "user"
58+
59+
60+
def test_update_me_shops(user_role_client: TestClient):
61+
shops = [factories.ShopFactory(), factories.ShopFactory()]
62+
shop_ids = [shop.id for shop in shops]
63+
64+
url = "/api/v1/me/shops"
65+
66+
resp = user_role_client.put(url=url, json=shop_ids)
67+
assert resp.status_code == 200, resp.text

‎server/tests/api/v1/test_shops.py

+104
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,104 @@
1+
import pytest
2+
from fastapi.testclient import TestClient
3+
4+
from tests.factories import ShopFactory
5+
6+
7+
def test_read_many(user_role_client: TestClient):
8+
"""
9+
Test reading many shops.
10+
"""
11+
12+
# Create some shops in the db first
13+
ShopFactory()
14+
ShopFactory()
15+
ShopFactory()
16+
17+
url = "/api/v1/shops/"
18+
resp = user_role_client.get(url=url)
19+
assert resp.status_code == 200, resp.json()
20+
data = resp.json()
21+
assert isinstance(data, list)
22+
assert len(data) >= 1
23+
24+
25+
def test_read(admin_role_client: TestClient):
26+
"""
27+
Test getting a shop.
28+
"""
29+
30+
# Create a shop to read first
31+
db_shop = ShopFactory()
32+
33+
shop_id = db_shop.id
34+
url = f"/api/v1/shops/{shop_id}"
35+
resp = admin_role_client.get(url)
36+
assert resp.status_code == 200, resp.text
37+
38+
39+
@pytest.mark.parametrize("user_id", [999, 0, -1, "g"])
40+
def test_read_invalid_id(admin_role_client: TestClient, user_id):
41+
"""
42+
Test getting a shop with an invalid id.
43+
"""
44+
45+
# Create a user to read first
46+
url = f"/api/v1/users/{user_id}"
47+
resp = admin_role_client.get(url)
48+
assert resp.status_code in [404, 422]
49+
50+
51+
def test_create(admin_role_client: TestClient):
52+
"""
53+
Test creating a shop.
54+
"""
55+
url = "/api/v1/shops/"
56+
data = {
57+
"name": "tesco",
58+
"url": "www.tesco.com",
59+
"query_url": "/groceries/en-GB/search?query={query}",
60+
"render_javascript": False,
61+
"listing_page_selector": {},
62+
}
63+
64+
resp = admin_role_client.post(url, json=data)
65+
assert resp.status_code == 201, resp.text
66+
67+
68+
def test_create_existing_name(admin_role_client: TestClient):
69+
"""
70+
Test creating a shop with an already existing name.
71+
"""
72+
db_shop = ShopFactory()
73+
name = db_shop.name
74+
url = "/api/v1/shops/"
75+
data = {
76+
"name": name,
77+
"url": "www.tesco.com",
78+
"query_url": "/groceries/en-GB/search?query={query}",
79+
"render_javascript": False,
80+
"listing_page_selector": {},
81+
}
82+
83+
resp = admin_role_client.post(url, json=data)
84+
assert resp.status_code == 400, resp.text
85+
86+
87+
def test_delete(admin_role_client: TestClient):
88+
"""
89+
Test deleting a user.
90+
"""
91+
92+
# Create one to delete first
93+
db_shop = ShopFactory()
94+
95+
id_ = db_shop.id
96+
97+
# Delete the shop
98+
url = f"/api/v1/shops/{id_}"
99+
resp = admin_role_client.delete(url)
100+
assert resp.status_code == 200
101+
102+
# Ensure user has been deleted from the database
103+
resp = admin_role_client.get(url)
104+
assert resp.status_code == 404

‎server/tests/api/v1/test_users.py

+18
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,8 @@
11
import pytest
22
from fastapi.testclient import TestClient
33

4+
from tests import factories
5+
46

57
@pytest.mark.parametrize(
68
"url, method",
@@ -155,3 +157,19 @@ def test_delete(admin_role_client: TestClient):
155157
# Ensure user has been deleted from the database
156158
resp = admin_role_client.get(url)
157159
assert resp.status_code == 404
160+
161+
162+
def test_update_user_roles(admin_role_client: TestClient):
163+
164+
# Create some roles in the db first
165+
roles = [factories.RoleFactory(), factories.RoleFactory()]
166+
role_ids = [role.id for role in roles]
167+
168+
# Create a user to assign the roles
169+
user = factories.UserFactory()
170+
user_id = user.id
171+
172+
url = f"/api/v1/users/{user_id}/roles"
173+
174+
resp = admin_role_client.put(url=url, json=role_ids)
175+
assert resp.status_code == 200, resp.text

0 commit comments

Comments
 (0)
This repository has been archived.