LSSTDESC
diff --git a/‎examples/cardinal_project.yaml‎
Lines changed: 64 additions & 0 deletions b/‎examples/cardinal_project.yaml‎
Lines changed: 64 additions & 0 deletions
diff --git a/‎examples/cardinal_project_library.yaml‎
Lines changed: 292 additions & 0 deletions b/‎examples/cardinal_project_library.yaml‎
Lines changed: 292 additions & 0 deletions
diff --git a/‎examples/rail_project_example.ipynb‎
Lines changed: 3 additions & 3 deletions b/‎examples/rail_project_example.ipynb‎
Lines changed: 3 additions & 3 deletions
@@ -0,0 +1,64 @@
+Project:
+
+  Name: test_cardinal
+
+  # Include other configuration files
+  Includes:
+    - examples/cardinal_project_library.yaml
+
+  PathTemplates: {}
+
+  CommonPaths:
+    root: /global/cfs/cdirs/lsst/groups/PZ/Cardinal
+    scratch_root: "{root}"
+    catalogs_dir: "{root}/parquet_files"
+    project: test_cardinal
+    sim_version: v1
+
+  # Baseline configuraiton, included in others by default
+  Baseline:
+    catalog_tag: cardinal
+    pipelines: ['all']
+    file_aliases:  # Set the training and test files
+      test: test_file_100k
+      train: train_file_100k
+      train_zCOSMOS: train_file_zCOSMOS_100k
+      wide: wide_file_full
+      deep: deep_file_full
+      spec: spec_file_full
+
+  # These define the variant configurations for the various parts of the analysis
+  Flavors:
+    - Flavor:
+        name: train_cosmos
+        pipelines: ['pz', 'tomography']
+        file_aliases:  # Set the training and test files
+          test: test_file_100k
+          train: train_file_zCOSMOS_100k
+    - Flavor:
+        name: gpz_gl
+        pipelines: ['pz']  # only run the pz pipeline
+        pipeline_overrides:  # Override specifics for particular pipelines
+          default:
+            kwargs:
+              algorithms: ['gpz']  # Only run gpz
+          inform:
+            inform_gpz:
+              gpz_method: GL
+
+  # These are variables that we iterate over when running over entire catalogs
+  IterationVars:
+    healpix:
+      - 427
+      - 428
+      - 429
+      - 430
+      - 431
+      - 432
+      - 73
+      - 122
+      - 99
+      - 16
+      - 58
+      - 277
+      - 346
@@ -0,0 +1,292 @@
+# This is the "library" of common defintions shared between similar projects
+
+# Templates we use to define catalogs
+#
+# A CatalogTemplate can be given several interpolants to resolve to a specific Catalog
+#
+# Some of the interpolants [{catalogs_dir}, {project}, {sim_version}]
+# are defined in the Project CommonPaths block
+#
+# Possibles values of {selection} are defined the the library "Selections" block
+#
+# Possible values of {flavor} are defined the the Project "Flavors" block
+Catalogs:
+  # The input "Truth" catalog
+  - CatalogTemplate:
+      name: truth
+      path_template: "{catalogs_dir}/Chinchilla-3-triofile.{healpix}.parquet"
+      iteration_vars: ['healpix']
+  # Catalogs that have been reduced using a particular selection
+  - CatalogTemplate:
+      name: reduced
+      path_template: "{catalogs_dir}/{project}_{selection}/{healpix}/Chinchilla-3-triofile.pq"
+      iteration_vars: ['healpix']
+  # Data output from running some degraders on the original catalog
+  # Note that the {basename} can be used to select which degraded output we want
+  - CatalogTemplate:
+      name: degraded
+      path_template: "{catalogs_dir}/{project}_{selection}_{flavor}/{healpix}/{basename}"
+      iteration_vars: ['healpix']
+
+
+# This file describes the templates we use to define files and specfic instances
+# of files
+#
+# A FileTemplate can be given several interpolants to resolve to a specific FileInstance
+#
+# Some of the interpolants [{catalogs_dir}, {project}]
+# are defined in the Project CommonPaths block
+#
+# Possibles values of {selection} are defined the the library "Selections" block
+Files:
+  # Testing data file
+  - FileTemplate:
+      name: test_file_100k
+      path_template: "{catalogs_dir}/test/{project}_{selection}_baseline_100k.hdf5"
+  # Generic training data file
+  - FileTemplate:
+      name: train_file_100k
+      path_template: "{catalogs_dir}/test/{project}_{selection}_baseline_100k.hdf5"
+  - FileTemplate:
+      name: train_file_200k
+      path_template: "{catalogs_dir}/test/{project}_{selection}_baseline_200k.hdf5"
+  - FileTemplate:
+      name: train_file_10
+      path_template: "{catalogs_dir}/test/{project}_{selection}_baseline_10.hdf5"
+  - FileTemplate:
+      name: test_split_file
+      path_template: "{catalogs_dir}/test/{project}_{selection}_baseline_split_test_10.hdf5"
+  - FileTemplate:
+      name: train_split_file
+      path_template: "{catalogs_dir}/train/{project}_{selection}_baseline_split_train_10.hdf5"      
+  - FileTemplate:
+      name: deep_file_full
+      path_template: "{catalogs_dir}/som/{project}_deep_data_full.hdf5"
+  - FileTemplate:
+      name: deep_file_small
+      path_template: "{catalogs_dir}/som/{project}_deep_data_small.hdf5"
+  - FileTemplate:
+      name: wide_file_full
+      path_template: "{catalogs_dir}/som/{project}_wide_data_full.hdf5"
+  - FileTemplate:
+      name: wide_file_small
+      path_template: "{catalogs_dir}/som/{project}_wide_data_small.hdf5"
+  - FileTemplate:
+      name: spec_file_full
+      path_template: "{catalogs_dir}/som/{project}_spec_data_full.hdf5"
+  - FileTemplate:
+      name: spec_file_small
+      path_template: "{catalogs_dir}/som/{project}_spec_data_small.hdf5"
+
+
+# The next plots list all available algorithms of various types and assigns short names each of then
+#
+
+# These	describe all the algorithms that emulate spectroscopic selections
+SpecSelections:
+  - SpecSelection:
+      name: zCOSMOS
+      Select: SpecSelection_zCOSMOS
+      Module: rail.creation.degraders.spectroscopic_selections
+
+
+# These describe all the algorithms that estimate PZ
+PZAlgorithms:
+  - PZAlgorithm:
+      name: trainz
+      Estimate: TrainZEstimator
+      Inform: TrainZInformer
+      Module: rail.estimation.algos.train_z
+  - PZAlgorithm:
+      name: simplenn
+      Estimate: SklNeurNetEstimator
+      Inform: SklNeurNetInformer
+      Module: rail.estimation.algos.sklearn_neurnet
+  - PZAlgorithm:
+      name: fzboost
+      Estimate: FlexZBoostEstimator
+      Inform: FlexZBoostInformer
+      Module: rail.estimation.algos.flexzboost
+  - PZAlgorithm:
+      name: knn
+      Estimate: KNearNeighEstimator
+      Inform: KNearNeighInformer
+      Module: rail.estimation.algos.k_nearneigh
+  - PZAlgorithm:
+      name: gpz
+      Estimate: GPzEstimator
+      Inform: GPzInformer
+      Module: rail.estimation.algos.gpz
+
+
+# These describe all the algorithms that classify objects into tomographic bins
+Classifiers:
+  - Classifier:
+      name: equal_count
+      Classify: EqualCountClassifier
+      Module: rail.estimation.algos.equal_count
+  - Classifier:
+      name: uniform_binning
+      Classify: UniformBinningClassifier
+      Module: rail.estimation.algos.uniform_binning
+
+
+# These describe the error models we use in the truth_to_observed pipeline
+ErrorModels:
+  - ErrorModel:
+      name: lsst
+      ErrorModel: LSSTErrorModel
+      Module: rail.creation.degraders.photometric_errors
+  - ErrorModel:
+      name: roman
+      ErrorModel: RomanErrorModel
+      Module: rail.creation.degraders.photometric_errors
+
+
+# These describe the ways we can sub-sample the data
+Subsamplers:
+  - Subsampler:
+      name: random_subsampler
+      Subsample: RandomSubsampler
+      Module: rail.projects.subsampler
+  - Subsampler:
+      name: multi_catalog_subsampler
+      Subsample: MultiCatalogSubsample
+      Module: rail.projects.subsampler
+
+
+# These describe the ways we can reduce the data
+Reducers:
+  - Reducer:
+      name: cardinal
+      Reduce: CardinalReducer
+      Module: rail.projects.reducer
+
+
+# These describe the various data analysis pipelines
+Pipelines:
+  - PipelineTemplate:
+      name: truth_to_observed
+      pipeline_class: rail.pipelines.degradation.truth_to_observed.TruthToObservedPipeline
+      input_catalog_template: reduced
+      output_catalog_template: degraded
+      kwargs:
+        error_models: ['all']
+        selectors: ['all']
+        blending: true
+  - PipelineTemplate:
+      name: prepare
+      pipeline_class: rail.pipelines.utils.prepare_observed.PrepareObservedPipeline
+      input_catalog_template: reduced
+      output_catalog_template: degraded
+  - PipelineTemplate:
+      name: photometric_errors
+      pipeline_class: rail.pipelines.degradation.apply_phot_errors.ApplyPhotErrorsPipeline
+      input_catalog_template: reduced
+      output_catalog_template: degraded
+      kwargs:
+        error_models: ['all']
+  - PipelineTemplate:
+      name: spec_selection
+      input_catalog_template: degraded
+      output_catalog_template: degraded
+      input_catalog_basename: output_dereddener_errors.pq
+      pipeline_class: rail.pipelines.degradation.spectroscopic_selection_pipeline.SpectroscopicSelectionPipeline
+      kwargs:
+        selectors: ['all']
+  - PipelineTemplate:
+      name: inform
+      pipeline_class: rail.pipelines.estimation.inform_all.InformPipeline
+      input_catalog_template: degraded
+      output_catalog_template: degraded
+      input_file_templates:
+        input:
+          flavor: baseline
+          tag: train
+      kwargs:
+        algorithms: ['all']
+  - PipelineTemplate:
+      name: estimate
+      pipeline_class: rail.pipelines.estimation.estimate_all.EstimatePipeline
+      input_catalog_template: degraded
+      output_catalog_template: degraded
+      input_file_templates:
+        input:
+          flavor: baseline
+          tag: test
+      kwargs:
+        algorithms: ['all']
+  - PipelineTemplate:
+      name: evaluate
+      pipeline_class: rail.pipelines.evaluation.evaluate_all.EvaluationPipeline
+      input_catalog_template: degraded
+      output_catalog_template: degraded
+      input_file_templates:
+        truth:
+          flavor: baseline
+          tag: test
+      kwargs:
+        algorithms: ['all']
+  - PipelineTemplate:
+      name: pz
+      pipeline_class: rail.pipelines.estimation.pz_all.PzPipeline
+      input_catalog_template: degraded
+      output_catalog_template: degraded
+      input_file_templates:
+        input_train:
+          flavor: baseline
+          tag: train
+        input_test:
+          flavor: baseline
+          tag: test
+      kwargs:
+        algorithms: ['all']
+# These describe the selections going from "truth" to "reduced" catalog
+
+# These just all use different limiting i-band magnitudes
+Selections:
+  - Selection:
+      name: maglim_25.5
+      cuts:
+        maglim_i: [null, 25.5]
+  - Selection:
+      name: gold
+      cuts:
+        maglim_i: [null, 25.5]
+  - Selection:
+      name: blend
+      cuts:
+        maglim_i: [null, 26.0]
+  - Selection:
+      name: crap
+      cuts:
+        maglim_i: [null, 30.0]
+  - Selection:
+      name: all
+      cuts:
+        maglim_i: [null, null]
+
+# These describe the subsampling used to make test and training datasets
+Subsamples:
+  # Testing subsample with 100 events
+  - Subsample:
+      name: test_100k
+      seed: 1234
+      num_objects: 100000
+  # Training subsample with 100k events, and a different seed to select the events
+  - Subsample:
+      name: train_100k
+      seed: 4321
+      num_objects: 100000
+  # Training subsample with 100k events, and a different seed to select the events
+  - Subsample:
+      name: train_200k
+      seed: 5555
+      num_objects: 200000
+
+# These describe the ways we can split the data
+Splitters:
+  - Splitter:
+      name: random_splitter
+      Split: RandomSplitter
+      Module: rail.projects.splitter
@@ -215,9 +215,9 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
+   "display_name": "testenv",
    "language": "python",
-   "name": "python3"
+   "name": "testenv"
   },
   "language_info": {
    "codemirror_mode": {
@@ -229,7 +229,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.11.4"
+   "version": "3.12.12"
   }
  },
  "nbformat": 4,