File tree Expand file tree Collapse file tree 1 file changed +6
-1
lines changed
loading_pipeline/lib/tasks/reference_data Expand file tree Collapse file tree 1 file changed +6
-1
lines changed Original file line number Diff line number Diff line change 11import luigi
22
3+ from loading_pipeline .lib .annotations .expression_helpers import get_expr_for_variant_id
34from loading_pipeline .lib .core .dataset_type import DatasetType
45from loading_pipeline .lib .core .definitions import ReferenceGenome
56from loading_pipeline .lib .paths import reference_dataset_parquet
@@ -31,7 +32,11 @@ def output(self):
3132 )
3233
3334 def run (self ):
34- df = self .reference_dataset .get_spark_dataframe (self .reference_genome )
35+ ht = self .reference_dataset .get_ht (self .reference_genome )
36+ ht = ht .annotate (
37+ variant_id = get_expr_for_variant_id (ht ),
38+ )
39+ df = ht .to_spark (flatten = False )
3540 df .write .parquet (
3641 self .output ().path ,
3742 mode = 'overwrite' ,
You can’t perform that action at this time.
0 commit comments