Module molcrawl.rna.utils.config
Classes
class CellxGenePreparationConfig (output_dir: str = 'learning_source_dummy/rna',
num_worker: int = 8,
size_workload: int = 10000,
census_version: str = '2023-12-15',
min_counts_genes: int = 2,
sqrt_scale_factor: float = 0)-
Expand source code
@dataclass class CellxGenePreparationConfig: # Output directory where the preparation will be made output_dir: str = RNA_DATASET_DIR # Num of worker to use during parallel processing. num_worker: int = 8 # Size of list of ids to give to each worker, save file will have `size_workload` number of ids in them. size_workload: int = 10000 # Version of the CellxGene census census_version: str = "2023-12-15" # Filter condition to filter genes with few counts across a dataset. min_counts_genes: int = 2 # Sqrt-scaling factor C for per-tissue cell subsampling. # Each tissue retains min(N, C * sqrt(N)) cells drawn without replacement. # Set to 0 (or omit) to disable subsampling and use all cells. sqrt_scale_factor: float = 0CellxGenePreparationConfig(output_dir: str = 'learning_source_dummy/rna', num_worker: int = 8, size_workload: int = 10000, census_version: str = '2023-12-15', min_counts_genes: int = 2, sqrt_scale_factor: float = 0)
Instance variables
var census_version : strvar min_counts_genes : intvar num_worker : intvar output_dir : strvar size_workload : intvar sqrt_scale_factor : float
class RnaConfig (data_preparation: CellxGenePreparationConfig = <factory>)-
Expand source code
@dataclass class RnaConfig(Config): data_preparation: CellxGenePreparationConfig = field(default_factory=CellxGenePreparationConfig) def __post_init__(self): if not isinstance(self.data_preparation, CellxGenePreparationConfig): # type: ignore[misc] self.data_preparation = CellxGenePreparationConfig(**self.data_preparation) # type: ignore[arg-type]RnaConfig(data_preparation: molcrawl.rna.utils.config.CellxGenePreparationConfig =
) Ancestors
Instance variables
var data_preparation : CellxGenePreparationConfig
Inherited members