Module src.data.world
Expand source code
import pathlib
from typing import Tuple
from src.utils import get_paths
import pandas as pd
import collections
# File name of the input-data CSV; get_input_data() joins it onto PATHS.data_processed.
INPUT_FILE = "SOCA_GLOBAL2_20200310.csv"
# File name of the metadata CSV; get_meta_data() joins it onto PATHS.data_processed.
META_FILE = "METADATA_20200310.csv"
# Project path container returned by src.utils.get_paths(); this module reads its
# `data_processed` attribute. NOTE(review): the returned type is not visible here --
# presumably `data_processed` is a pathlib.Path; confirm in src.utils.
PATHS = get_paths()
# Lightweight record with three list-valued fields: "meta", "input" and "output".
FEATURES = collections.namedtuple("FEATURES", ["meta", "input", "output"])

# Names grouped by role for the world dataset. The "meta" names are used as the
# index columns of the merged frame in get_full_data().
# NOTE(review): the ".1"/".2" suffixes presumably come from pandas de-duplicating
# repeated CSV header names -- confirm against the data files.
world_features = FEATURES(
    meta=["wmo", "n_cycle", "N", "lon", "lat", "juld", "date"],
    input=[
        "sla",
        "PAR",
        # RHO_WN_412 ... RHO_WN_670
        *(f"RHO_WN_{band}" for band in (412, 443, 490, 555, 670)),
        "doy_sin",
        "doy_cos",
        # x_cart, y_cart, z_cart
        *(f"{axis}_cart" for axis in "xyz"),
        # PC1 ... PC7
        *(f"PC{k}" for k in range(1, 8)),
        "PC1.1",
        "PC2.1",
        "PC3.1",
        "PC1.2",
        "PC2.2",
        "PC3.2",
        "PC4.1",
    ],
    # "bbp" followed by "bbp.1" ... "bbp.18" (19 names in total).
    output=["bbp", *(f"bbp.{k}" for k in range(1, 19))],
)
def get_meta_data() -> pd.DataFrame:
    """Read the metadata CSV into a DataFrame.

    The file is ``META_FILE`` located under ``PATHS.data_processed``.

    Returns:
        The parsed CSV contents, using ``pd.read_csv`` defaults.
    """
    meta_csv = PATHS.data_processed.joinpath(META_FILE)
    return pd.read_csv(f"{meta_csv}")
def get_input_data() -> pd.DataFrame:
    """Read the input-data CSV into a DataFrame.

    The file is ``INPUT_FILE`` located under ``PATHS.data_processed``.

    Returns:
        The parsed CSV contents, using ``pd.read_csv`` defaults.
    """
    input_csv = PATHS.data_processed.joinpath(INPUT_FILE)
    return pd.read_csv(f"{input_csv}")
def get_full_data() -> pd.DataFrame:
    """Merge the metadata and input tables and index the result by the meta columns.

    ``pd.merge`` is called with its defaults, so the join keys are whatever
    column names the two frames share and the join type is pandas' default.

    Returns:
        The merged frame with ``world_features.meta`` set as its index.
    """
    # Load metadata first, then inputs (same order as the merge arguments).
    meta_frame = get_meta_data()
    input_frame = get_input_data()
    merged = pd.merge(meta_frame, input_frame)
    return merged.set_index(world_features.meta)
Functions
def get_full_data() -> pandas.core.frame.DataFrame
-
Expand source code
def get_full_data() -> pd.DataFrame:
    """Merge the metadata and input tables and index the result by the meta columns.

    ``pd.merge`` is called with its defaults, so the join keys are whatever
    column names the two frames share and the join type is pandas' default.

    Returns:
        The merged frame with ``world_features.meta`` set as its index.
    """
    # Load metadata first, then inputs (same order as the merge arguments).
    meta_frame = get_meta_data()
    input_frame = get_input_data()
    merged = pd.merge(meta_frame, input_frame)
    return merged.set_index(world_features.meta)
def get_input_data() -> pandas.core.frame.DataFrame
-
Expand source code
def get_input_data() -> pd.DataFrame:
    """Read the input-data CSV into a DataFrame.

    The file is ``INPUT_FILE`` located under ``PATHS.data_processed``.

    Returns:
        The parsed CSV contents, using ``pd.read_csv`` defaults.
    """
    input_csv = PATHS.data_processed.joinpath(INPUT_FILE)
    return pd.read_csv(f"{input_csv}")
def get_meta_data() -> pandas.core.frame.DataFrame
-
Expand source code
def get_meta_data() -> pd.DataFrame:
    """Read the metadata CSV into a DataFrame.

    The file is ``META_FILE`` located under ``PATHS.data_processed``.

    Returns:
        The parsed CSV contents, using ``pd.read_csv`` defaults.
    """
    meta_csv = PATHS.data_processed.joinpath(META_FILE)
    return pd.read_csv(f"{meta_csv}")
Classes
class FEATURES (meta, input, output)
-
FEATURES(meta, input, output)
Ancestors
- builtins.tuple
Instance variables
var input
-
Alias for field number 1
var meta
-
Alias for field number 0
var output
-
Alias for field number 2