Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: remove s3 file from annotations and use an observation array in… #28

Open
wants to merge 24 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
24 commits
Select commit Hold shift + click to select a range
bc98566
feat: remove s3 file from annotations and use an observation array in…
Nastaliss Jun 24, 2023
ae0ed9b
fix: image path
Nastaliss Apr 1, 2024
ceec8b5
feat: add correct tests for annotations and observations
Nastaliss Apr 1, 2024
3acab3b
feat: sort types
Nastaliss Apr 1, 2024
c1d8d3c
feat: update only observations
Nastaliss Apr 1, 2024
a7496a3
test: build docker wait for probing doc
Nastaliss Apr 1, 2024
d26245c
feat: add health-check
Nastaliss Apr 1, 2024
20f218e
feat: remove hc on backend;
Nastaliss Apr 1, 2024
620934b
feat: hard-code env vars for db
Nastaliss Apr 1, 2024
6b27953
feat: wait for condition healthy
Nastaliss Apr 1, 2024
5d89bf5
feat: add health-checks in dev
Nastaliss Apr 1, 2024
5267883
feat: lint
Nastaliss Apr 1, 2024
62c4f9f
chore: retrigger ci
Nastaliss Jul 1, 2024
212cda3
chore(deps): Bump certifi from 2022.12.7 to 2023.7.22 (#29)
dependabot[bot] Aug 15, 2023
ee5f16e
chore(deps): Bump gitpython from 3.1.31 to 3.1.34 (#31)
dependabot[bot] Sep 16, 2023
b746327
chore(deps): Bump gitpython from 3.1.34 to 3.1.35 (#32)
dependabot[bot] Sep 16, 2023
64941bd
feat: Enables CORS using FastAPI middleware (#26)
frgfm Sep 16, 2023
a6df74b
chore(deps): Bump urllib3 from 1.26.15 to 1.26.17 (#33)
dependabot[bot] Oct 8, 2023
90d0326
chore(deps): Bump gitpython from 3.1.35 to 3.1.37 (#34)
dependabot[bot] Oct 18, 2023
ebc4104
chore(deps): Bump urllib3 from 1.26.17 to 1.26.18 (#35)
dependabot[bot] Oct 18, 2023
0acfed9
fix: use string as json key
Nastaliss Jul 1, 2024
43e4a50
fix: no explicit none
Nastaliss Jul 1, 2024
0c1f2f2
Merge branch 'main' into simplify-annotations
Nastaliss Jul 6, 2024
793a7bb
Merge remote-tracking branch 'origin/main' into simplify-annotations
Nastaliss Jul 6, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
11 changes: 5 additions & 6 deletions .github/workflows/builds.yml
Original file line number Diff line number Diff line change
Expand Up @@ -29,12 +29,11 @@ jobs:
S3_SECRET_KEY: ${{ secrets.S3_SECRET_KEY }}
S3_REGION: ${{ secrets.S3_REGION }}
S3_ENDPOINT_URL: ${{ secrets.S3_ENDPOINT_URL }}
run: docker-compose up -d --build
- name: Docker sanity check
run: sleep 20 && nc -vz localhost 8080
- name: Ping server
run: curl http://localhost:8080/docs

run: |
docker compose up -d --build --wait
docker compose logs backend
nc -vz localhost 8080
curl http://localhost:8080/docs
client:
runs-on: ${{ matrix.os }}
strategy:
Expand Down
1 change: 1 addition & 0 deletions client/docs/source/conf.py
Original file line number Diff line number Diff line change
Expand Up @@ -104,6 +104,7 @@
# so a file named "default.css" will overwrite the builtin "default.css".
html_static_path = ["_static"]


# Add googleanalytics id
# ref: https://github.com/orenhecht/googleanalytics/blob/master/sphinxcontrib/googleanalytics.py
def add_ga_javascript(app, pagename, templatename, context, doctree):
Expand Down
47 changes: 16 additions & 31 deletions client/pyrostorage/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@

import io
import logging
from typing import Dict
from typing import Dict, List
from urllib.parse import urljoin

import requests
Expand All @@ -29,8 +29,7 @@
# ANNOTATIONS
#################
"create-annotation": "/annotations",
"upload-annotation": "/annotations/{annotation_id}/upload",
"get-annotation-url": "/annotations/{annotation_id}/url",
"update-annotation": "/annotations/{annotation_id}",
}


Expand Down Expand Up @@ -129,7 +128,7 @@ def get_media_url(self, media_id: int) -> Response:

return requests.get(self.routes["get-media-url"].format(media_id=media_id), headers=self.headers)

def create_annotation(self, media_id: int) -> Response:
def create_annotation(self, media_id: int, observations: List[str]) -> Response:
"""Create an annotation entry

Example::
Expand All @@ -139,49 +138,35 @@ def create_annotation(self, media_id: int) -> Response:

Args:
media_id: the identifier of the media entry
observations: list of observations

Returns:
HTTP response containing the created annotation
"""

return requests.post(self.routes["create-annotation"], headers=self.headers, json={"media_id": media_id})

def upload_annotation(self, annotation_id: int, annotation_data: bytes) -> Response:
"""Upload the annotation content

Example::
>>> from pyrostorage import client
>>> api_client = client.Client("http://pyro-storage.herokuapp.com", "MY_LOGIN", "MY_PWD")
>>> with open("path/to/my/file.ext", "rb") as f: data = f.read()
>>> response = api_client.upload_annotation(annotation_id=1, annotation_data=data)

Args:
annotation_id: ID of the associated annotation entry
annotation_data: byte data

Returns:
HTTP response containing the updated annotation
"""

return requests.post(
self.routes["upload-annotation"].format(annotation_id=annotation_id),
self.routes["create-annotation"],
headers=self.headers,
files={"file": io.BytesIO(annotation_data)},
json={"media_id": media_id, "observations": observations},
)

def get_annotation_url(self, annotation_id: int) -> Response:
"""Get the image as a URL
def update_annotation(self, annotation_id: int, observations: List[str]) -> Response:
"""Update an annotation entry

Example::
>>> from pyrostorage import client
>>> api_client = client.Client("http://pyro-storage.herokuapp.com", "MY_LOGIN", "MY_PWD")
>>> response = api_client.get_annotation_url(1)
>>> response = api_client.update_annotation(media_id=1)

Args:
annotation_id: the identifier of the annotation entry
observations: list of observations

Returns:
HTTP response containing the URL to the annotation content
HTTP response containing the updated annotation
"""

return requests.get(self.routes["get-annotation-url"].format(annotation_id=annotation_id), headers=self.headers)
return requests.post(
f'self.routes["update-annotation"]/{annotation_id}',
headers=self.headers,
json={"observations": observations},
)
2 changes: 1 addition & 1 deletion client/tests/test_client.py
Original file line number Diff line number Diff line change
Expand Up @@ -30,7 +30,7 @@ def test_client():
# Media
media_id = _test_route_return(api_client.create_media(media_type="image"), dict, 201)["id"]
# Annotation
_test_route_return(api_client.create_annotation(media_id=media_id), dict, 201)["id"]
_test_route_return(api_client.create_annotation(media_id=media_id, observations=["smoke", "fire"]), dict, 201)["id"]

# Check token refresh
prev_headers = deepcopy(api_client.headers)
Expand Down
10 changes: 10 additions & 0 deletions docker-compose-dev.yml
Original file line number Diff line number Diff line change
Expand Up @@ -23,6 +23,11 @@ services:
- S3_ENDPOINT_URL=${S3_ENDPOINT_URL}
depends_on:
- db
healthcheck:
test: ['CMD-SHELL', 'nc -vz localhost 8080']
interval: 10s
timeout: 3s
retries: 3
db:
image: postgres:15-alpine
volumes:
Expand All @@ -33,6 +38,11 @@ services:
- POSTGRES_USER=dummy_pg_user
- POSTGRES_PASSWORD=dummy_pg_pwd
- POSTGRES_DB=dummy_pg_db
healthcheck:
test: ['CMD-SHELL', "sh -c 'pg_isready -U dummy_pg_user -d dummy_pg_db'"]
interval: 10s
timeout: 3s
retries: 3
proxy:
build: nginx
ports:
Expand Down
20 changes: 12 additions & 8 deletions docker-compose.yml
Original file line number Diff line number Diff line change
Expand Up @@ -18,8 +18,14 @@ services:
- S3_SECRET_KEY=${S3_SECRET_KEY}
- S3_REGION=${S3_REGION}
- S3_ENDPOINT_URL=${S3_ENDPOINT_URL}
healthcheck:
test: ['CMD-SHELL', 'nc -vz localhost 8080']
interval: 10s
timeout: 3s
retries: 3
depends_on:
- db
db:
condition: service_healthy
db:
image: postgres:15-alpine
volumes:
Expand All @@ -30,13 +36,11 @@ services:
- POSTGRES_USER=dummy_pg_user
- POSTGRES_PASSWORD=dummy_pg_pwd
- POSTGRES_DB=dummy_pg_db
nginx:
build: nginx
ports:
- 80:80
- 443:443
depends_on:
- backend
healthcheck:
test: ['CMD-SHELL', "sh -c 'pg_isready -U dummy_pg_user -d dummy_pg_db'"]
interval: 10s
timeout: 3s
retries: 3

volumes:
postgres_data:
2 changes: 1 addition & 1 deletion src/Dockerfile-dev
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
FROM pyrostorage:python3.8-alpine3.10
FROM pyronear/storage-api:python3.8-alpine3.10

# copy requirements file
COPY requirements-dev.txt requirements-dev.txt
Expand Down
78 changes: 5 additions & 73 deletions src/app/api/routes/annotations.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,15 +5,13 @@

from typing import Any, Dict, List

from fastapi import APIRouter, BackgroundTasks, File, HTTPException, Path, Security, UploadFile, status
from fastapi import APIRouter, Path, Security, status

from app.api import crud
from app.api.crud.authorizations import check_access_read, is_admin_access
from app.api.deps import get_current_access
from app.api.schemas import AccessType, AnnotationCreation, AnnotationIn, AnnotationOut, AnnotationUrl
from app.api.security import hash_content_file
from app.api.schemas import AccessType, AnnotationIn, AnnotationOut, AnnotationUpdateIn
from app.db import annotations
from app.services import resolve_bucket_key, s3_bucket

router = APIRouter()

Expand All @@ -33,7 +31,7 @@ async def create_annotation(
payload: AnnotationIn, _=Security(get_current_access, scopes=[AccessType.admin, AccessType.user])
):
"""
Creates an annotation related to specific media, based on media_id as argument
Creates an annotation related to specific media, based on media_id as argument, and with as many observations as needed

Below, click on "Schema" for more detailed information about arguments
or "Example Value" to get a concrete idea of arguments
Expand Down Expand Up @@ -66,9 +64,9 @@ async def fetch_annotations(
return []


@router.put("/{annotation_id}/", response_model=AnnotationOut, summary="Update information about a specific annotation")
@router.put("/{annotation_id}/", response_model=AnnotationOut, summary="Update observations on a specific annotation")
async def update_annotation(
payload: AnnotationIn,
payload: AnnotationUpdateIn,
annotation_id: int = Path(..., gt=0),
_=Security(get_current_access, scopes=[AccessType.admin]),
):
Expand All @@ -86,69 +84,3 @@ async def delete_annotation(
Based on a annotation_id, deletes the specified annotation
"""
return await crud.delete_entry(annotations, annotation_id)


@router.post("/{annotation_id}/upload", response_model=AnnotationOut, status_code=200)
async def upload_annotation(
background_tasks: BackgroundTasks,
annotation_id: int = Path(..., gt=0),
file: UploadFile = File(...),
):
"""
Upload a annotation (image or video) linked to an existing annotation object in the DB
"""

# Check in DB
entry = await check_annotation_registration(annotation_id)

# Concatenate the first 32 chars (to avoid system interactions issues) of SHA256 hash with file extension
file_hash = hash_content_file(file.file.read())
file_name = f"{file_hash[:32]}.{file.filename.rpartition('.')[-1]}"
# Reset byte position of the file (cf. https://fastapi.tiangolo.com/tutorial/request-files/#uploadfile)
await file.seek(0)
# Use MD5 to verify upload
md5_hash = hash_content_file(file.file.read(), use_md5=True)
await file.seek(0)
# If files are in a subfolder of the bucket, prepend the folder path
bucket_key = resolve_bucket_key(file_name, "annotations")

# Upload if bucket_key is different (otherwise the content is the exact same)
if isinstance(entry["bucket_key"], str) and entry["bucket_key"] == bucket_key:
return await crud.get_entry(annotations, annotation_id)
else:
# Failed upload
if not await s3_bucket.upload_file(bucket_key=bucket_key, file_binary=file.file):
raise HTTPException(status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail="Failed upload")
# Data integrity check
file_meta = await s3_bucket.get_file_metadata(bucket_key)
# Corrupted file
if md5_hash != file_meta["ETag"].replace('"', ""):
# Delete the corrupted upload
await s3_bucket.delete_file(bucket_key)
# Raise the exception
raise HTTPException(
status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
detail="Data was corrupted during upload",
)
# If a file was previously uploaded, delete it
if isinstance(entry["bucket_key"], str):
await s3_bucket.delete_file(entry["bucket_key"])

entry_dict = dict(**entry)
entry_dict["bucket_key"] = bucket_key
return await crud.update_entry(annotations, AnnotationCreation(**entry_dict), annotation_id)


@router.get("/{annotation_id}/url", response_model=AnnotationUrl, status_code=200)
async def get_annotation_url(
annotation_id: int = Path(..., gt=0),
requester=Security(get_current_access, scopes=[AccessType.admin, AccessType.user]),
):
"""Resolve the temporary media image URL"""
await check_access_read(requester.id)

# Check in DB
annotation_instance = await check_annotation_registration(annotation_id)
# Check in bucket
temp_public_url = await s3_bucket.get_public_url(annotation_instance["bucket_key"])
return AnnotationUrl(url=temp_public_url)
11 changes: 4 additions & 7 deletions src/app/api/schemas.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@

from pydantic import BaseModel, Field, validator

from app.db.models import AccessType, MediaType
from app.db.models import AccessType, MediaType, ObservationType


# Template classes
Expand Down Expand Up @@ -88,15 +88,12 @@ class MediaUrl(BaseModel):
# Annotation
class AnnotationIn(BaseModel):
media_id: int = Field(..., gt=0)
observations: List[ObservationType]


class AnnotationCreation(AnnotationIn):
bucket_key: str = Field(...)
class AnnotationUpdateIn(BaseModel):
observations: List[ObservationType]


class AnnotationOut(AnnotationIn, _CreatedAt, _Id):
pass


class AnnotationUrl(BaseModel):
url: str
14 changes: 11 additions & 3 deletions src/app/db/models.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,7 @@

import enum

from sqlalchemy import Column, DateTime, Enum, ForeignKey, Integer, String
from sqlalchemy import ARRAY, Column, DateTime, Enum, ForeignKey, Integer, String
from sqlalchemy.orm import relationship
from sqlalchemy.sql import func

Expand Down Expand Up @@ -46,15 +46,23 @@ def __repr__(self):
return f"<Media(bucket_key='{self.bucket_key}', type='{self.type}'>"


class ObservationType(str, enum.Enum):
clouds: str = "clouds"
fire: str = "fire"
fog: str = "fog"
sky: str = "sky"
smoke: str = "smoke"


class Annotations(Base):
__tablename__ = "annotations"

id = Column(Integer, primary_key=True)
media_id = Column(Integer, ForeignKey("media.id"))
bucket_key = Column(String(100), nullable=True)
observations = Column(ARRAY(Enum(ObservationType)), nullable=False)
created_at = Column(DateTime, default=func.now())

media = relationship("Media", uselist=False, back_populates="annotations")

def __repr__(self):
return f"<Media(media_id='{self.media_id}', bucket_key='{self.bucket_key}'>"
return f"<Media(media_id='{self.media_id}', observations='{self.observations}'>"
2 changes: 1 addition & 1 deletion src/tests/crud/test_authorizations.py
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,7 @@


ANNOTATIONS_TABLE = [
{"id": 1, "media_id": 1, "created_at": "2020-10-13T08:18:45.447773"},
{"id": 1, "media_id": 1, "observations": [], "created_at": "2020-10-13T08:18:45.447773"},
]


Expand Down
2 changes: 1 addition & 1 deletion src/tests/db_utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,7 @@ async def fill_table(test_db: Database, table: Table, entries: List[Dict[str, An
are not incremented if the "id" field is included
"""
if remove_ids:
entries = [{k: v for k, v in x.items() if k != "id"} for x in entries]
entries = [{k: v for k, v in entry.items() if k != "id"} for entry in entries]

query = table.insert().values(entries)
await test_db.execute(query=query)
Expand Down
Loading
Loading