22import json
33import multiprocessing as mp
44import os
5+ from glob import glob
56
67import fsspec
78import numpy as np
89import pandas as pd
9- from tqdm import tqdm
1010from args import parse_args
11- from glob import glob
11+ from tqdm import tqdm
1212
1313
1414def scan_csv (year , root_path , region , model , data = "picks" , fs = None , bucket = None , protocol = "file" ):
@@ -24,6 +24,7 @@ def scan_csv(year, root_path, region, model, data="picks", fs=None, bucket=None,
2424 csvs = fs .glob (f"{ jday } /??/*.csv" )
2525 else :
2626 csvs = glob (f"{ root_path } /{ region } /{ model } /{ data } _{ model } /{ year } /{ jday } /??/*.csv" )
27+ # csvs = glob(f"{root_path}/{region}/{model}/{data}_{model}/{year}/{jday}/*.csv")
2728
2829 csv_list .extend ([[year , jday , csv ] for csv in csvs ])
2930
@@ -129,6 +130,10 @@ def read_csv(rows, region, model, data, year, jday, root_path, fs=None, bucket=N
129130 for csv in tqdm (csvs , desc = f"Merge { data } csv files" ):
130131 picks .append (pd .read_csv (csv , dtype = str ))
131132 picks = pd .concat (picks , ignore_index = True )
133+ print (f"Number of { data } : { len (picks ):,} " )
134+ if data == "picks" :
135+ print (f"Number of P picks: { len (picks [picks ['phase_type' ] == 'P' ]):,} " )
136+ print (f"Number of S picks: { len (picks [picks ['phase_type' ] == 'S' ]):,} " )
132137 picks .to_csv (f"{ root_path } /{ region } /{ model } /{ model } _{ data } .csv" , index = False )
133138
134139 # %%
0 commit comments