|
a |
|
b/tests/test_dataset_assumptions.py |
|
|
1 |
import pytest |
|
|
2 |
import os |
|
|
3 |
import pandas as pd |
|
|
4 |
|
|
|
5 |
# Loaded once at import time and shared by every test below; the path is
# relative, so it is resolved against the current working directory.
metadata = pd.read_csv(filepath_or_buffer="metadata.csv")
|
|
6 |
|
|
|
7 |
def test_no_duplicate_images():
    """Check that no value appears twice in the metadata ``filename`` column."""
    names = list(metadata["filename"])
    distinct_names = set(names)
    # Collapsing to a set drops repeats, so equal sizes mean no duplicates.
    assert len(names) == len(distinct_names)
|
|
10 |
|
|
|
11 |
def test_no_unlinked_images():
    """Check that the files in ``images`` match what the metadata references.

    The set of directory entries that are not listed in the ``filename``
    column must be exactly the single expected warning image.
    """
    referenced = set(metadata["filename"])
    on_disk = set(os.listdir("images"))
    # The only unlinked image should be the warning image
    expected_unlinked = {'FAFA-A1BF-49A8-A1D3-66FAFA41B7345D.jpg'}
    assert on_disk - referenced == expected_unlinked
|
|
16 |
|
|
|
17 |
def test_no_pediatric():
    """Check that no metadata row records an age below 18.

    Rows with a missing (NaN) age are ignored. The builtin ``min()`` is
    deliberately avoided: it compares elements pairwise, so with NaN present
    its result depends on where the NaN sits in the column (a leading NaN
    makes the check fail, a later one is silently skipped).
    """
    ages = metadata["age"]
    # `NaN < 18` evaluates to False, so missing ages are never selected here,
    # regardless of their position in the column.
    underage = ages[ages < 18]
    assert underage.empty, "found ages below 18: {}".format(
        sorted(underage.unique())
    )