documentation of read_csv

2023-01-01 18:01:57 +05:30 · 2023-01-01 18:01:57 +05:30 · 3a5ca91234
commit 3a5ca91234
parent db8f73d5c6
1 changed files with 49 additions and 3 deletions
--- a/pyfacts/pyfacts.py
+++ b/pyfacts/pyfacts.py
@ -568,6 +568,7 @@ class TimeSeries(TimeSeriesCore):
        Parameters
        ----------
        kwargs: parameters to be passed to the calculate_rolling_returns() function
                Refer to the TimeSeries.calculate_rolling_returns() method for more details
        Returns
        -------
@ -866,7 +867,9 @@ class TimeSeries(TimeSeriesCore):
        return self.__class__(new_ts_dict, to_frequency.symbol)
-def _preprocess_csv(file_path: str | pathlib.Path, delimiter: str = ",", encoding: str = "utf-8") -> List[list]:
+def _preprocess_csv(
    file_path: str | pathlib.Path, delimiter: str = ",", encoding: str = "utf-8", **kwargs
 ) -> List[list]:
    """Preprocess csv data"""
    if isinstance(file_path, str):
@ -876,7 +879,7 @@ def _preprocess_csv(file_path: str | pathlib.Path, delimiter: str = ",", encodin
        raise ValueError("File not found. Check the file path")
    with open(file_path, "r", encoding=encoding) as file:
-        reader: csv.reader = csv.reader(file, delimiter=delimiter)
+        reader: csv.reader = csv.reader(file, delimiter=delimiter, **kwargs)
        csv_data: list = list(reader)
    csv_data = [i for i in csv_data if i]  # remove blank rows
@ -897,8 +900,51 @@ def read_csv(
    nrows: int = -1,
    delimiter: str = ",",
    encoding: str = "utf-8",
    **kwargs,
 ) -> TimeSeries:
-    """Reads Time Series data directly from a CSV file"""
+    """Reads Time Series data directly from a CSV file
    Parameters
    ----------
    csv_file_path:
        path of the csv file to be read.
    frequency:
        frequency of the time series data.
    date_format:
        date format, specified as datetime compatible string
    col_names:
        specify the column headers to be read.
        this parameter will allow you to read two columns from a CSV file which may have more columns.
        this parameter overrides col_index parameter.
    col_index:
        specify the column numbers to be read.
        this parameter will allow you to read two columns from a CSV file which may have more columns.
        if neither names nor index is specified, the first two columns from the csv file will be read,
        with the first being treated as date.
    has_header:
        specify whether the file has a header row.
        if true, the header row will be ignored while creating the time series data.
    skip_rows:
        the number of rows after the header which should be skipped.
    nrows:
        the number of rows to be read from the csv file.
    delimiter:
        specify the delimiter used in the csv file.
    encoding:
        specify the encoding of the csv file.
    kwargs:
        other keyword arguments to be passed on to csv.reader()
    """
    data = _preprocess_csv(csv_file_path, delimiter, encoding)