# Data generation for RNA velocity analysis in dentate gyrus

Generates `.h5ad` files to analyze RNA velocity in the dentate gyrus using different pre-processing protocols.

## Preliminaries

**Requires**

* `DATA_DIR/dentategyrus/Dentate_gyrus_adata_quantifications_combined.h5ad`

**Output**

* `DATA_DIR/dentategyrus/alevin_prepref_isocollapse_cdna_introns_decoy_gentrome.h5ad`
* `DATA_DIR/dentategyrus/alevin_prepref_isocollapse_cdna_introns_gentrome.h5ad`
* `DATA_DIR/dentategyrus/alevin_prepref_isoseparate_cdna_introns_decoy_gentrome.h5ad`
* `DATA_DIR/dentategyrus/alevin_prepref_isoseparate_cdna_introns_gentrome.h5ad`
* `DATA_DIR/dentategyrus/alevin_spliced_unspliced_gentrome.h5ad`
* `DATA_DIR/dentategyrus/kallisto_bustools_prepref_isocollapse_exclude.h5ad`
* `DATA_DIR/dentategyrus/kallisto_bustools_prepref_isocollapse_include.h5ad`
* `DATA_DIR/dentategyrus/kallisto_bustools_prepref_isoseparate_exclude.h5ad`
* `DATA_DIR/dentategyrus/kallisto_bustools_prepref_isoseparate_include.h5ad`
* `DATA_DIR/dentategyrus/starsolo.h5ad`
* `DATA_DIR/dentategyrus/starsolo_subtr.h5ad`

## Library imports

In [1]:
from pathlib import Path
import sys

# import standard packages
import pandas as pd

# import single-cell packages
from anndata import AnnData
import scanpy as sc

sys.path.append("../../..")
from paths import DATA_DIR

## Data loading

In [2]:
# Read the combined quantification object listed under "Requires"; the trailing
# bare expression makes the notebook display its summary.
combined_path = DATA_DIR / "dentategyrus" / "Dentate_gyrus_adata_quantifications_combined.h5ad"
adata = sc.read(combined_path)
adata

AnnData object with n_obs × n_vars = 2914 × 54144
    obs: 'cell_index', 'clusters', 'age.days.', 'clusters_enlarged'
    uns: 'X_name', 'dataset'
    obsm: 'PCA_alevin_spliced_gentrome', 'TSNE_alevin_spliced_gentrome', 'UMAP_alevin_spliced_gentrome'
    layers: 'alevin_prepref_isocollapse_cdna_introns_decoy_gentrome_spliced', 'alevin_prepref_isocollapse_cdna_introns_decoy_gentrome_unspliced', 'alevin_prepref_isocollapse_cdna_introns_gentrome_spliced', 'alevin_prepref_isocollapse_cdna_introns_gentrome_unspliced', 'alevin_prepref_isoseparate_cdna_introns_decoy_gentrome_spliced', 'alevin_prepref_isoseparate_cdna_introns_decoy_gentrome_unspliced', 'alevin_prepref_isoseparate_cdna_introns_gentrome_spliced', 'alevin_prepref_isoseparate_cdna_introns_gentrome_unspliced', 'alevin_spliced_gentrome_counts', 'alevin_spliced_unspliced_gentrome_spliced', 'alevin_spliced_unspliced_gentrome_unspliced', 'kallisto_bustools_prepref_isocollapse_exclude_unspliced', 'kallisto_bustools_prepref_isocollapse_i

## Data generation

In [3]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "alevin_prepref_isocollapse_cdna_introns_decoy_gentrome"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

alevin_coll_decoy_gtr = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
alevin_coll_decoy_gtr.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  alevin_coll_decoy_gtr = AnnData(


In [4]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "alevin_prepref_isocollapse_cdna_introns_gentrome"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

alevin_coll_gtr = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
alevin_coll_gtr.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  alevin_coll_gtr = AnnData(


In [5]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "alevin_prepref_isoseparate_cdna_introns_decoy_gentrome"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

alevin_sep_decoy_gtr = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
alevin_sep_decoy_gtr.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  alevin_sep_decoy_gtr = AnnData(


In [6]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "alevin_prepref_isoseparate_cdna_introns_gentrome"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

alevin_sep_gtr = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
alevin_sep_gtr.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  alevin_sep_gtr = AnnData(


In [7]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "alevin_spliced_unspliced_gentrome"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

alevin_spliced_unspliced_gtr = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
alevin_spliced_unspliced_gtr.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  alevin_spliced_unspliced_gtr = AnnData(


In [8]:
# Build the standalone AnnData for one protocol and write it to disk.
# Unlike the other protocols, the spliced matrix here is taken from `adata.X`;
# only the unspliced matrix is read from a layer.
# NOTE(review): presumably `adata.X` holds this protocol's spliced matrix
# (see `adata.uns['X_name']`) — confirm against the combined file.
protocol = "kallisto_bustools_prepref_isocollapse_exclude"
spliced = adata.X
unspliced = adata.layers[f"{protocol}_unspliced"]

kalisto_bustools_coll_excl = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
kalisto_bustools_coll_excl.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

In [9]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "kallisto_bustools_prepref_isocollapse_include"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

kalisto_bustools_coll_incl = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
kalisto_bustools_coll_incl.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  kalisto_bustools_coll_incl = AnnData(


In [10]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "kallisto_bustools_prepref_isoseparate_exclude"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

kalisto_bustools_sep_excl = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
kalisto_bustools_sep_excl.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  kalisto_bustools_sep_excl = AnnData(


In [11]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "kallisto_bustools_prepref_isoseparate_include"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

kalisto_bustools_sep_incl = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
kalisto_bustools_sep_incl.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  kalisto_bustools_sep_incl = AnnData(


In [12]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "starsolo"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

starsolo = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
starsolo.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  starsolo = AnnData(


In [13]:
# Copy the spliced/unspliced layers of one protocol out of the combined object
# into a standalone AnnData (spliced doubles as X) and write it to disk.
protocol = "starsolo_subtr"
spliced = adata.layers[f"{protocol}_spliced"]
unspliced = adata.layers[f"{protocol}_unspliced"]

starsolo_diff = AnnData(
    X=spliced,
    layers={"unspliced": unspliced, "spliced": spliced},
    obs=adata.obs[["cell_index", "clusters", "age.days.", "clusters_enlarged"]],
    var=pd.DataFrame(index=adata.var_names),
)
starsolo_diff.write(DATA_DIR / "dentategyrus" / f"{protocol}.h5ad")

  starsolo_diff = AnnData(
