stdgcn Config

This is the config for stdgcn.

examples/tuning/deconv_stdgcn/hcc_liver/pipeline_params_tuning_config.yaml
---
type: preprocessor
tune_mode: pipeline_params
pipeline_tuning_top_k: 3
parameter_tuning_freq_n: 20
pipeline:
  - type: misc
    target: CelltypeTransform
  - type: pseudobulk
    target: pseudoSpotGen
    params:
      spot_num: 30000
      min_cell_number_in_spot: 8
      max_cell_number_in_spot: 12
      max_cell_types_in_spot: 4
      generation_method: celltype
      n_jobs: -1
  - type: misc
    target: RemoveSplit
    params:
      split_name: ref
      log_level: INFO
  - type: filter.gene
    target: FilterGenesCommon
    params:
      split_keys: [pseudo, test]
  - type: filter.gene
    include:
      - FilterGenesPercentile
      - FilterGenesScanpyOrder
      - FilterGenesPlaceHolder
    default_params:
      FilterGenesScanpyOrder:
        order: [min_counts, max_counts, min_cells, max_cells]
        min_counts: 100
        max_counts: 0.99
        min_cells: 0.01
        max_cells: 0.99
  - type: misc
    target: SaveRaw
  - type: normalize
    include:
      - ColumnSumNormalize
      - ScTransform
      - Log1P
      - NormalizeTotal
      - NormalizePlaceHolder
      - NormalizeTotalLog1P
    default_params:
      ScTransform:
        processes_num: 8
  - type: filter.gene
    include:
      - HighlyVariableGenesLogarithmizedByMeanAndDisp
      - HighlyVariableGenesRawCount
      - FilterGenesNumberPlaceHolder
      - HighlyVariableGenesLogarithmizedByTopGenes
      - FilterGenesTopK
      - FilterGenesRegression
    default_params:
      FilterGenesTopK:
        num_genes: 3000
      FilterGenesRegression:
        num_genes: 3000
      HighlyVariableGenesRawCount:
        n_top_genes: 3000
      HighlyVariableGenesLogarithmizedByTopGenes:
        n_top_genes: 3000
  - type: misc
    target: updateAnndataObsTransform
    params:
      split: test
  - type: misc
    target: CellTypeNum
  - type: feature.cell
    include:
      - CellPCA
      - CellSVD
      - WeightedFeaturePCA
      - WeightedFeatureSVD
      - GaussRandProjFeature
      - FeatureCellPlaceHolder
    params:
      out: feature.cell
      log_level: INFO
    default_params:
      CellPCA:
        n_components: 400
      CellSVD:
        n_components: 400
      GaussRandProjFeature:
        n_components: 400
      WeightedFeaturePCA:
        n_components: 400
      WeightedFeatureSVD:
        n_components: 400
  - type: data.interagration
    target: DataInteragraionTransform
    params:
      batch_removal_method:
      min_dim: 30
      dimensionality_reduction_method:
      scale: false
      cpu_num: 1
      AE_device: cpu
  - type: graph.cell
    target: stdgcnGraph
    params:
      inter_find_neighbor_method: MNN
      inter_dist_method: cosine
      inter_corr_dist_neighbors: 20
      spatial_link_method: soft
      space_dist_threshold: 2.0
      real_intra_find_neighbor_method: MNN
      real_intra_dist_method: cosine
      real_intra_pca_dimensionality_reduction: false
      real_intra_corr_dist_neighbors: 10
      real_intra_dim: 50
      pseudo_intra_find_neighbor_method: MNN
      pseudo_intra_dist_method: cosine
      pseudo_intra_corr_dist_neighbors: 20
      pseudo_intra_pca_dimensionality_reduction: false
      pseudo_intra_dim: 50
  - type: data.interagration
    target: DataInteragraionTransform
    params:
      batch_removal_method:
      min_dim: 80
      dimensionality_reduction_method:
      scale: false
      cpu_num: 1
      AE_device: cpu
  - type: misc
    target: SetConfig
    params:
      config_dict:
        label_channel: cell_type_portion
wandb:
  entity: xzy11632
  project: dance-dev
  method: grid  # try grid to provide a comprehensive search
  metric:
    name: MSE
    goal: minimize