FileReader

`FileReader`

Provide functionality to read, filter, and write data from a TXT file located in the TxtInOut folder.

Source code in pySWATPlus/filereader.py

class FileReader:

    '''
    Provide functionality to read, filter, and write data
    from a TXT file located in the `TxtInOut` folder.
    '''

    def __init__(
        self,
        path: str | pathlib.Path,
        has_units: bool,
    ):
        '''
        Initialize a FileReader instance to read data from a TXT file.

        Args:
            path (str or Path): Path to the TXT file to be read.
            has_units (bool): If `True`, the second row of the file contains units.

        Example:
            ```python
            reader = FileReader(
                path='C:\\users\\username\\project\\Scenarios\\Default\\TxtInOut\\plants.plt',
                has_units=False
            )
            ```
        '''

        if not isinstance(path, (str, pathlib.Path)):
            raise TypeError("path must be a string or Path object")

        path = pathlib.Path(path).resolve()

        if not path.is_file():
            raise FileNotFoundError("file does not exist")

        self.has_units = has_units

        # if output ends with _day, _mon, _yr, _aa, _subday (removing the suffix), it means is an output file from SWAT.
        # if file is a csv is output file
        self.is_output_file = path.stem.endswith(('_day', '_mon', '_yr', '_aa', '_subday')) or path.suffix == '.csv'

        # skips the header
        skip_rows = [0, 2] if self.has_units else [0]

        # read only first line of file
        with open(path, 'r', encoding='latin-1') as file:
            self.header_file = file.readline()

        self.df = utils._load_file(path, skip_rows=skip_rows)

        # if file is a csv is output file
        if path.suffix == '.csv' and self.has_units:
            _df = pandas.read_csv(path, skiprows=[0], nrows=2, header=None, skipinitialspace=True)
            self.units_row = utils._clean(_df).iloc[1].copy()

        elif self.has_units:  # has_units and txt file
            # Units row may have some empty values, so we cannot use read_csv.
            # We'll use read_fwf; infer number of columns using first data row.
            _df = pandas.read_fwf(path, skiprows=[0, 1], nrows=2, header=None)
            self.units_row = utils._clean(_df).iloc[0].copy()

            # If _df has only one row, the original file may have no data rows.
            # Try reading using the header row as reference (but it may have issues sometimes)
            if len(_df) == 1:
                _df = pandas.read_fwf(path, skiprows=[0], nrows=2, header=None)
                self.units_row = utils._clean(_df).iloc[1].copy()
        else:
            self.units_row = None

        # Check if units row matches the DataFrame's column count
        if self.has_units:
            if len(self.units_row) != self.df.shape[1]:
                raise ValueError(
                    "Units row could not be parsed correctly. Check if your file is well-formed."
                )

        self.path = path

    def overwrite_file(
        self
    ) -> None:
        '''
        Overwrite the original TXT file with the modified DataFrame content.
        If the file originally contained a unit row (below the header),
        it will be preserved and written back as part of the output.
        If the file is a SWAT+ Output File, launch exception.
        '''
        if self.is_output_file:
            raise ValueError("Overwriting SWAT+ Output Files is not allowed")

        if self.units_row is not None:
            _df = pandas.concat([pandas.DataFrame([self.units_row]), self.df], ignore_index=True)
        else:
            _df = self.df

        # Replace NaN with empty strings to avoid printing 'NaN'
        _df = _df.fillna('')

        with open(self.path, 'w') as file:
            # Write the header file first
            file.write(self.header_file)

            if _df.empty:
                # Calculate max width for each column name
                col_widths = [max(len(col), 1) + 3 for col in _df.columns]

                # Create format string with fixed widths, right-aligned
                fmt = ''.join([f'{{:>{w}}}' for w in col_widths])

                # Format and write the header line
                file.write(fmt.format(*_df.columns) + '\n')
                return

            max_lengths = _df.apply(lambda x: x.astype(str).str.len()).max()
            column_widths = {column: max_length + 3 for column, max_length in max_lengths.items()}
            data_str = _df.to_string(index=False, justify='right', col_space=column_widths)
            file.write(data_str)

`init(path: str | pathlib.Path, has_units: bool)`

Initialize a FileReader instance to read data from a TXT file.

Parameters:

Name	Type	Description	Default
`path`	`str or Path`	Path to the TXT file to be read.	required
`has_units`	`bool`	If `True`, the second row of the file contains units.	required

Example

reader = FileReader(
    path='C:\users\username\project\Scenarios\Default\TxtInOut\plants.plt',
    has_units=False
)

Source code in pySWATPlus/filereader.py

def __init__(
    self,
    path: str | pathlib.Path,
    has_units: bool,
):
    '''
    Initialize a FileReader instance to read data from a TXT file.

    Args:
        path (str or Path): Path to the TXT file to be read.
        has_units (bool): If `True`, the second row of the file contains units.

    Example:
        ```python
        reader = FileReader(
            path='C:\\users\\username\\project\\Scenarios\\Default\\TxtInOut\\plants.plt',
            has_units=False
        )
        ```
    '''

    if not isinstance(path, (str, pathlib.Path)):
        raise TypeError("path must be a string or Path object")

    path = pathlib.Path(path).resolve()

    if not path.is_file():
        raise FileNotFoundError("file does not exist")

    self.has_units = has_units

    # if output ends with _day, _mon, _yr, _aa, _subday (removing the suffix), it means is an output file from SWAT.
    # if file is a csv is output file
    self.is_output_file = path.stem.endswith(('_day', '_mon', '_yr', '_aa', '_subday')) or path.suffix == '.csv'

    # skips the header
    skip_rows = [0, 2] if self.has_units else [0]

    # read only first line of file
    with open(path, 'r', encoding='latin-1') as file:
        self.header_file = file.readline()

    self.df = utils._load_file(path, skip_rows=skip_rows)

    # if file is a csv is output file
    if path.suffix == '.csv' and self.has_units:
        _df = pandas.read_csv(path, skiprows=[0], nrows=2, header=None, skipinitialspace=True)
        self.units_row = utils._clean(_df).iloc[1].copy()

    elif self.has_units:  # has_units and txt file
        # Units row may have some empty values, so we cannot use read_csv.
        # We'll use read_fwf; infer number of columns using first data row.
        _df = pandas.read_fwf(path, skiprows=[0, 1], nrows=2, header=None)
        self.units_row = utils._clean(_df).iloc[0].copy()

        # If _df has only one row, the original file may have no data rows.
        # Try reading using the header row as reference (but it may have issues sometimes)
        if len(_df) == 1:
            _df = pandas.read_fwf(path, skiprows=[0], nrows=2, header=None)
            self.units_row = utils._clean(_df).iloc[1].copy()
    else:
        self.units_row = None

    # Check if units row matches the DataFrame's column count
    if self.has_units:
        if len(self.units_row) != self.df.shape[1]:
            raise ValueError(
                "Units row could not be parsed correctly. Check if your file is well-formed."
            )

    self.path = path

`overwrite_file() -> None`

Overwrite the original TXT file with the modified DataFrame content. If the file originally contained a unit row (below the header), it will be preserved and written back as part of the output. If the file is a SWAT+ Output File, launch exception.

Source code in pySWATPlus/filereader.py

def overwrite_file(
    self
) -> None:
    '''
    Overwrite the original TXT file with the modified DataFrame content.
    If the file originally contained a unit row (below the header),
    it will be preserved and written back as part of the output.
    If the file is a SWAT+ Output File, launch exception.
    '''
    if self.is_output_file:
        raise ValueError("Overwriting SWAT+ Output Files is not allowed")

    if self.units_row is not None:
        _df = pandas.concat([pandas.DataFrame([self.units_row]), self.df], ignore_index=True)
    else:
        _df = self.df

    # Replace NaN with empty strings to avoid printing 'NaN'
    _df = _df.fillna('')

    with open(self.path, 'w') as file:
        # Write the header file first
        file.write(self.header_file)

        if _df.empty:
            # Calculate max width for each column name
            col_widths = [max(len(col), 1) + 3 for col in _df.columns]

            # Create format string with fixed widths, right-aligned
            fmt = ''.join([f'{{:>{w}}}' for w in col_widths])

            # Format and write the header line
            file.write(fmt.format(*_df.columns) + '\n')
            return

        max_lengths = _df.apply(lambda x: x.astype(str).str.len()).max()
        column_widths = {column: max_length + 3 for column, max_length in max_lengths.items()}
        data_str = _df.to_string(index=False, justify='right', col_space=column_widths)
        file.write(data_str)

FileReader

FileReader

__init__(path: str | pathlib.Path, has_units: bool)

overwrite_file() -> None

`FileReader`

`init(path: str | pathlib.Path, has_units: bool)`

`overwrite_file() -> None`