# Task 4
# Load data
def load_data(path: str = "/path/to/csv/") -> pd.DataFrame:
    """
    Load a CSV file into a Pandas DataFrame.

    :param path: str (optional), location of the CSV file; handed straight
                 to ``pd.read_csv``

    :return df: pd.DataFrame, the file contents without the "Unnamed: 0"
                column, if the file had one
    """
    df = pd.read_csv(path)
    # pandas labels a header-less first column "Unnamed: 0" (typically an
    # index written out by an earlier to_csv); errors="ignore" makes the
    # drop a no-op when the column is absent.
    return df.drop(columns=["Unnamed: 0"], errors="ignore")


# Create target variable and predictor variables
# NOTE(review): the `def` line for this step could not be recovered from the
# source text; the name and signature are reconstructed from the names the
# body uses (`data`, `target`) -- confirm against callers.
def create_target_and_predictors(data: pd.DataFrame, target: str):
    """
    Split a DataFrame into predictor columns and a target column.

    :param data: pd.DataFrame, table that contains the target column
    :param target: str, name of the column to predict

    :return X: pd.DataFrame, ``data`` without the ``target`` column
            y: pd.Series, the ``target`` column
    :raises KeyError: if ``target`` is not a column of ``data``
    """
    X = data.drop(columns=[target])
    y = data[target]
    return X, y
# Train algorithm
def train_algorithm_with_cross_validation(
X: pd.DataFrame = None,
y: pd.Series = None
):
"""
This function takes the predictor and target variables and
trains a Random Forest Regressor model across K folds. Using
cross-validation, performance metrics will be output for each
fold during training.
:return
"""
# Train model
trained_model = model.fit(X_train, y_train)