33import gzip
44import os
55import pickle
6- from datetime import datetime
6+ from datetime import datetime , UTC
77
88from codex .data .neuron_data_initializer import (
99 initialize_neuron_data ,
1717DATA_ROOT_PATH = "static/data"
1818NEURON_FILE_NAME = "neurons.csv.gz"
1919CLASSIFICATION_FILE_NAME = "classification.csv.gz"
20+ CONSOLIDATED_CELL_TYPES_FILE_NAME = "consolidated_cell_types.csv.gz"
2021CELL_STATS_ROWS = "cell_stats.csv.gz"
2122CONNECTIONS_FILE_NAME = "connections.csv.gz"
2223LABELS_FILE_NAME = "labels.csv.gz"
2324COORDINATES_FILE_NAME = "coordinates.csv.gz"
2425NBLAST_FILE_NAME = "nblast.csv.gz"
2526CONNECTIVITY_TAGS_FILE_NAME = "connectivity_tags.csv.gz"
26- MORPHOLOGY_CLUSTERS_FILE_NAME = "morphology_clusters.csv.gz"
27- CONNECTIVITY_CLUSTERS_FILE_NAME = "connectivity_clusters.csv.gz"
28- SVD_FILE_NAME = "svd.csv.gz"
29- LR_MATCHING_FILE_NAME = "lr_matching.csv.gz"
3027
3128
3229NEURON_DB_PICKLE_FILE_NAME = "neuron_db.pickle.gz"
3330
34- GCS_PICKLE_URL_TEMPLATE = "https://storage.googleapis.com/flywire-data/codex/data/{version}/neuron_db.pickle.gz"
31+ GCS_PICKLE_URL_TEMPLATE = "https://storage.googleapis.com/flywire-data/codex/data/fafb/ {version}/neuron_db.pickle.gz"
3532GCS_RAW_DATA_URL_TEMPLATE = (
36- "https://storage.googleapis.com/flywire-data/codex/data/{version}/{filename}"
33+ "https://storage.googleapis.com/flywire-data/codex/data/fafb/ {version}/{filename}"
3734)
3835
3936
@@ -67,8 +64,8 @@ def _read_data(filename, with_timestamp=False):
6764 if os .path .exists (fname ):
6865 rows = read_csv (fname )
6966 if with_timestamp :
70- return rows , datetime .utcfromtimestamp (
71- os .path .getmtime (fname )
67+ return rows , datetime .fromtimestamp (
68+ os .path .getmtime (fname ), UTC
7269 ).strftime ("%Y-%m-%d" )
7370 else :
7471 return rows
@@ -80,6 +77,7 @@ def _read_data(filename, with_timestamp=False):
8077
8178 neuron_rows = _read_data (NEURON_FILE_NAME )
8279 classification_rows = _read_data (CLASSIFICATION_FILE_NAME )
80+ cell_type_rows = _read_data (CONSOLIDATED_CELL_TYPES_FILE_NAME )
8381 cell_stats_rows = _read_data (CELL_STATS_ROWS )
8482 connection_rows = _read_data (CONNECTIONS_FILE_NAME )
8583 label_rows , labels_file_timestamp = _read_data (
@@ -88,10 +86,6 @@ def _read_data(filename, with_timestamp=False):
8886 coordinate_rows = _read_data (COORDINATES_FILE_NAME )
8987 nblast_rows = _read_data (NBLAST_FILE_NAME )
9088 connectivity_tag_rows = _read_data (CONNECTIVITY_TAGS_FILE_NAME )
91- morphology_cluster_rows = _read_data (MORPHOLOGY_CLUSTERS_FILE_NAME )
92- connectivity_cluster_rows = _read_data (CONNECTIVITY_CLUSTERS_FILE_NAME )
93- svd_rows = _read_data (SVD_FILE_NAME )
94- lr_matching_rows = _read_data (LR_MATCHING_FILE_NAME )
9589
9690 print (
9791 f" loading data from { data_file_path } :\n "
@@ -104,23 +98,21 @@ def _read_data(filename, with_timestamp=False):
10498 neuron_db = initialize_neuron_data (
10599 neuron_file_rows = neuron_rows ,
106100 classification_rows = classification_rows ,
101+ cell_type_rows = cell_type_rows ,
107102 cell_stats_rows = cell_stats_rows ,
108103 connection_rows = connection_rows ,
109104 label_rows = label_rows ,
110105 labels_file_timestamp = labels_file_timestamp ,
111106 coordinate_rows = coordinate_rows ,
112107 nblast_rows = nblast_rows ,
113108 connectivity_tag_rows = connectivity_tag_rows ,
114- morphology_cluster_rows = morphology_cluster_rows ,
115- connectivity_cluster_rows = connectivity_cluster_rows ,
116- svd_rows = svd_rows ,
117- lr_matching_rows = lr_matching_rows ,
118109 )
119110 # free mem
120111 del neuron_rows
121112 del connection_rows
122113 del label_rows
123114 del coordinate_rows
115+ del cell_type_rows
124116 return neuron_db
125117
126118
0 commit comments