Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
A
alibylite
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Wiki
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Deploy
Releases
Package registry
Container Registry
Model registry
Operate
Terraform modules
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
Swain Lab
aliby
alibylite
Commits
27fd9ffd
Commit
27fd9ffd
authored
2 years ago
by
Alán Muñoz
Browse files
Options
Downloads
Patches
Plain Diff
[WIP] feat(dataset): add DatasetDir
parent
929d626f
No related branches found
No related tags found
No related merge requests found
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
src/aliby/io/dataset.py
+44
-14
44 additions, 14 deletions
src/aliby/io/dataset.py
src/aliby/pipeline.py
+1
-1
1 addition, 1 deletion
src/aliby/pipeline.py
with
45 additions
and
15 deletions
src/aliby/io/dataset.py
+
44
−
14
View file @
27fd9ffd
...
...
@@ -5,9 +5,11 @@ Dataset is a group of classes to manage multiple types of experiments:
- Local experiments in a multidimensional OME-TIFF image containing the metadata
- Local experiments in a directory containing multiple positions in independent images with or without metadata
"""
import
os
import
shutil
import
time
import
typing
as
t
from
abc
import
ABC
,
abstractproperty
from
abc
import
ABC
,
abstractproperty
,
abstractmethod
from
pathlib
import
Path
,
PosixPath
from
typing
import
Union
...
...
@@ -27,7 +29,7 @@ class DatasetLocalABC(ABC):
_valid_meta_suffixes
=
(
"
txt
"
,
"
log
"
)
def
__init__
(
self
,
dpath
:
Union
[
str
,
PosixPath
],
*
args
,
**
kwargs
):
self
.
f
path
=
Path
(
dpath
)
self
.
path
=
Path
(
dpath
)
def
__enter__
(
self
):
return
self
...
...
@@ -37,34 +39,26 @@ class DatasetLocalABC(ABC):
@property
def
dataset
(
self
):
return
self
.
f
path
return
self
.
path
@property
def
name
(
self
):
return
self
.
f
path
.
name
return
self
.
path
.
name
@property
def
unique_name
(
self
):
return
self
.
f
path
.
name
return
self
.
path
.
name
@abstractproperty
def
date
(
self
):
pass
def
get_images
(
self
):
# Fetches all valid formats and overwrites if duplicates with different suffix
return
{
f
.
name
:
str
(
f
)
for
suffix
in
self
.
_valid_suffixes
for
f
in
self
.
fpath
.
glob
(
f
"
*.
{
suffix
}
"
)
}
@property
def
files
(
self
):
if
not
hasattr
(
self
,
"
_files
"
):
self
.
_files
=
{
f
:
f
for
f
in
self
.
f
path
.
rglob
(
"
*
"
)
for
f
in
self
.
path
.
rglob
(
"
*
"
)
if
any
(
str
(
f
).
endswith
(
suffix
)
for
suffix
in
self
.
_valid_meta_suffixes
...
...
@@ -78,11 +72,39 @@ class DatasetLocalABC(ABC):
shutil
.
copy
(
annotation
,
root_dir
/
name
.
name
)
return
True
@abstractmethod
def get_images(self):
    """Return the location of the images and their unique names.

    Abstract hook: this base definition has an empty body and is meant
    to be overridden by concrete dataset classes.
    """
class DatasetLocalDir(DatasetLocalABC):
    """
    Organise an entire dataset, composed of multiple images, as a directory
    containing directories with individual files.

    It relies on ImageDir to manage images.
    """

    def __init__(self, dpath: Union[str, PosixPath], *args, **kwargs):
        """
        Parameters
        ----------
        dpath : str or PosixPath
            Root directory of the dataset; forwarded to the parent class.
        *args, **kwargs
            Accepted for signature compatibility; not forwarded.
        """
        super().__init__(dpath)

    @property
    def date(self):
        """
        Date of the dataset folder formatted as ``YYYYMMDD``.

        The value is taken from the folder's last-modification time
        (``os.path.getmtime``), for cases where metadata is minimal.
        """
        # Convert the timestamp directly to local time instead of
        # round-tripping through time.ctime()/time.strptime(): ctime()
        # emits fixed English day/month names, while strptime() parses
        # them using the current locale, so the round trip can fail when
        # LC_TIME is set to a non-English locale.
        modified = time.localtime(os.path.getmtime(self.path))
        return time.strftime("%Y%m%d", modified)

    def get_images(self):
        """
        List the sub-folders of the dataset that hold at least one file
        whose name matches ``*.<suffix>`` for a suffix in
        ``self._valid_meta_suffixes``.

        Returns
        -------
        list of pathlib.Path
            One entry per matching sub-folder.
        """
        # NOTE(review): folders are selected on the *metadata* suffixes,
        # not on image suffixes -- confirm this is intended.
        # NOTE(review): DatasetLocalOME.get_images returns a dict of
        # {name: path}; this returns a list -- confirm what callers expect.
        return [
            folder
            for folder in self.path.glob("*/")
            # Explicit directory check: older pathlib versions ignore the
            # trailing slash in the pattern and also yield plain files.
            if folder.is_dir()
            and any(
                True
                for suffix in self._valid_meta_suffixes
                for _ in folder.glob(f"*.{suffix}")
            )
        ]
class
DatasetLocalOME
(
DatasetLocalABC
):
"""
Load a dataset from a folder
...
...
@@ -102,6 +124,14 @@ class DatasetLocalOME(DatasetLocalABC):
# Access the date from the metadata of the first position
return
ImageLocalOME
(
list
(
self
.
get_images
().
values
())[
0
]).
date
def get_images(self):
    """
    Collect the image files found directly under ``self.path``.

    Every suffix in ``self._valid_suffixes`` is globbed in turn as
    ``*.<suffix>``.

    Returns
    -------
    dict
        Maps each file name to its path as a string. If the same file
        name is produced more than once, the later entry replaces the
        earlier one.
    """
    images = {}
    for suffix in self._valid_suffixes:
        pattern = f"*.{suffix}"
        for image_path in self.path.glob(pattern):
            images[image_path.name] = str(image_path)
    return images
class
Dataset
(
BridgeOmero
):
def
__init__
(
self
,
expt_id
,
**
server_info
):
...
...
This diff is collapsed.
Click to expand it.
src/aliby/pipeline.py
+
1
−
1
View file @
27fd9ffd
...
...
@@ -29,7 +29,7 @@ from agora.io.writer import ( # BabyWriter,
)
from
aliby.baby_client
import
BabyParameters
,
BabyRunner
from
aliby.haystack
import
initialise_tf
from
aliby.io.dataset
import
Dataset
,
DatasetLocal
from
aliby.io.dataset
import
Dataset
,
DatasetLocal
OME
,
DatasetLocalDir
from
aliby.io.image
import
get_image_class
from
aliby.tile.tiler
import
Tiler
,
TilerParameters
from
extraction.core.extractor
import
Extractor
,
ExtractorParameters
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment