Compare commits
	
		
			5 Commits
		
	
	
		
			58524aae7e
			...
			cd05250e8a
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| cd05250e8a | |||
| 47e11546a0 | |||
| 141ec97a2c | |||
| 439fa86b5c | |||
| 2c1d508734 | 
							
								
								
									
										118
									
								
								fincal/core.py
									
									
									
									
									
								
							
							
						
						
									
										118
									
								
								fincal/core.py
									
									
									
									
									
								
							| @ -1,5 +1,6 @@ | |||||||
| import datetime | import datetime | ||||||
| from dataclasses import dataclass | from dataclasses import dataclass | ||||||
|  | from numbers import Number | ||||||
| from typing import Iterable, List, Literal, Mapping, Sequence, Tuple, Union | from typing import Iterable, List, Literal, Mapping, Sequence, Tuple, Union | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
| @ -111,6 +112,67 @@ class IndexSlicer: | |||||||
|         return item |         return item | ||||||
| 
 | 
 | ||||||
| 
 | 
 | ||||||
|  | class Series: | ||||||
|  |     def __init__(self, data): | ||||||
|  |         if not isinstance(data, Sequence): | ||||||
|  |             raise TypeError("Series only supports creation using Sequence types") | ||||||
|  | 
 | ||||||
|  |         if isinstance(data[0], bool): | ||||||
|  |             self.data = data | ||||||
|  |             self.dtype = bool | ||||||
|  |         elif isinstance(data[0], Number): | ||||||
|  |             self.dtype = float | ||||||
|  |             self.data = [float(i) for i in data] | ||||||
|  |         elif isinstance(data[0], str): | ||||||
|  |             try: | ||||||
|  |                 data = [datetime.datetime.strptime(i, FincalOptions.date_format) for i in data] | ||||||
|  |                 self.dtype = datetime.datetime | ||||||
|  |             except ValueError: | ||||||
|  |                 raise TypeError("Series does not support string data type") | ||||||
|  |         elif isinstance(data[0], datetime.datetime): | ||||||
|  |             self.dtype = datetime.datetime | ||||||
|  |             self.data = data | ||||||
|  |         else: | ||||||
|  |             raise TypeError(f"Cannot create series object from {type(data).__name__} of {type(data[0]).__name__}") | ||||||
|  | 
 | ||||||
|  |     def __repr__(self): | ||||||
|  |         return f"{self.__class__.__name__}({self.data})" | ||||||
|  | 
 | ||||||
|  |     def __getitem__(self, n): | ||||||
|  |         return self.data[n] | ||||||
|  | 
 | ||||||
|  |     def __len__(self): | ||||||
|  |         return len(self.data) | ||||||
|  | 
 | ||||||
|  |     def __gt__(self, other): | ||||||
|  |         if self.dtype == bool: | ||||||
|  |             raise TypeError("> not supported for boolean series") | ||||||
|  | 
 | ||||||
|  |         if self.dtype == float and isinstance(other, Number) or isinstance(other, self.dtype): | ||||||
|  |             gt = Series([i > other for i in self.data]) | ||||||
|  |         else: | ||||||
|  |             raise Exception(f"Cannot compare type {self.dtype.__name__} to {type(other).__name__}") | ||||||
|  | 
 | ||||||
|  |         return gt | ||||||
|  | 
 | ||||||
|  |     def __lt__(self, other): | ||||||
|  |         if self.dtype == bool: | ||||||
|  |             raise TypeError("< not supported for boolean series") | ||||||
|  | 
 | ||||||
|  |         if self.dtype == float and isinstance(other, Number) or isinstance(other, self.dtype): | ||||||
|  |             lt = Series([i < other for i in self.data]) | ||||||
|  |         else: | ||||||
|  |             raise Exception(f"Cannot compare type {self.dtype.__name__} to {type(other).__name__}") | ||||||
|  |         return lt | ||||||
|  | 
 | ||||||
|  |     def __eq__(self, other): | ||||||
|  |         if self.dtype == float and isinstance(other, Number) or isinstance(other, self.dtype): | ||||||
|  |             eq = Series([i == other for i in self.data]) | ||||||
|  |         else: | ||||||
|  |             raise Exception(f"Cannot compare type {self.dtype.__name__} to {type(other).__name__}") | ||||||
|  |         return eq | ||||||
|  | 
 | ||||||
|  | 
 | ||||||
| class TimeSeriesCore: | class TimeSeriesCore: | ||||||
|     """Defines the core building blocks of a TimeSeries object""" |     """Defines the core building blocks of a TimeSeries object""" | ||||||
| 
 | 
 | ||||||
| @ -142,12 +204,36 @@ class TimeSeriesCore: | |||||||
|         data = _preprocess_timeseries(data, date_format=date_format) |         data = _preprocess_timeseries(data, date_format=date_format) | ||||||
| 
 | 
 | ||||||
|         self.time_series = dict(data) |         self.time_series = dict(data) | ||||||
|         self.dates = list(self.time_series) |  | ||||||
|         if len(self.time_series) != len(data): |         if len(self.time_series) != len(data): | ||||||
|             print("Warning: The input data contains duplicate dates which have been ignored.") |             print("Warning: The input data contains duplicate dates which have been ignored.") | ||||||
|         self.start_date = self.dates[0] |  | ||||||
|         self.end_date = self.dates[-1] |  | ||||||
|         self.frequency = getattr(AllFrequencies, frequency) |         self.frequency = getattr(AllFrequencies, frequency) | ||||||
|  |         self.iter_num = -1 | ||||||
|  |         self._dates = None | ||||||
|  |         self._values = None | ||||||
|  |         self._start_date = None | ||||||
|  |         self._end_date = None | ||||||
|  | 
 | ||||||
|  |     @property | ||||||
|  |     def dates(self): | ||||||
|  |         if self._dates is None or len(self._dates) != len(self.time_series): | ||||||
|  |             self._dates = list(self.time_series.keys()) | ||||||
|  | 
 | ||||||
|  |         return Series(self._dates) | ||||||
|  | 
 | ||||||
|  |     @property | ||||||
|  |     def values(self): | ||||||
|  |         if self._values is None or len(self._values) != len(self.time_series): | ||||||
|  |             self._values = list(self.time_series.values()) | ||||||
|  | 
 | ||||||
|  |         return Series(self._values) | ||||||
|  | 
 | ||||||
|  |     @property | ||||||
|  |     def start_date(self): | ||||||
|  |         return self.dates[0] | ||||||
|  | 
 | ||||||
|  |     @property | ||||||
|  |     def end_date(self): | ||||||
|  |         return self.dates[-1] | ||||||
| 
 | 
 | ||||||
|     def _get_printable_slice(self, n: int): |     def _get_printable_slice(self, n: int): | ||||||
|         """Returns a slice of the dataframe from beginning and end""" |         """Returns a slice of the dataframe from beginning and end""" | ||||||
| @ -193,11 +279,25 @@ class TimeSeriesCore: | |||||||
|         return printable_str |         return printable_str | ||||||
| 
 | 
 | ||||||
|     def __getitem__(self, key): |     def __getitem__(self, key): | ||||||
|  |         if isinstance(key, Series): | ||||||
|  |             if not key.dtype == bool: | ||||||
|  |                 raise ValueError(f"Cannot slice {self.__class__.__name__} using a Series of {key.dtype.__name__}") | ||||||
|  |             elif len(key) != len(self.dates): | ||||||
|  |                 raise Exception(f"Length of Series: {len(key)} did not match length of object: {len(self.dates)}") | ||||||
|  |             else: | ||||||
|  |                 dates_to_return = [self.dates[i] for i, j in enumerate(key) if j] | ||||||
|  |                 data_to_return = [(key, self.time_series[key]) for key in dates_to_return] | ||||||
|  |                 return TimeSeriesCore(data_to_return) | ||||||
|  | 
 | ||||||
|         if isinstance(key, int): |         if isinstance(key, int): | ||||||
|             raise KeyError(f"{key}. For index based slicing, use .iloc[{key}]") |             raise KeyError(f"{key}. For index based slicing, use .iloc[{key}]") | ||||||
|         elif isinstance(key, datetime.datetime): |         elif isinstance(key, datetime.datetime): | ||||||
|             item = (key, self.time_series[key]) |             item = (key, self.time_series[key]) | ||||||
|         if isinstance(key, str): |         if isinstance(key, str): | ||||||
|  |             if key == 'dates': | ||||||
|  |                 return self.dates | ||||||
|  |             elif key == 'values': | ||||||
|  |                 return list(self.time_series.values()) | ||||||
|             try: |             try: | ||||||
|                 dt_key = datetime.datetime.strptime(key, FincalOptions.date_format) |                 dt_key = datetime.datetime.strptime(key, FincalOptions.date_format) | ||||||
|                 item = (dt_key, self.time_series[dt_key]) |                 item = (dt_key, self.time_series[dt_key]) | ||||||
| @ -215,6 +315,18 @@ class TimeSeriesCore: | |||||||
|     def __len__(self): |     def __len__(self): | ||||||
|         return len(self.time_series) |         return len(self.time_series) | ||||||
| 
 | 
 | ||||||
|  |     def __iter__(self): | ||||||
|  |         self.n = 0 | ||||||
|  |         return self | ||||||
|  | 
 | ||||||
|  |     def __next__(self): | ||||||
|  |         if self.n >= len(self.dates): | ||||||
|  |             raise StopIteration | ||||||
|  |         else: | ||||||
|  |             key = self.dates[self.n] | ||||||
|  |             self.n += 1 | ||||||
|  |             return key, self.time_series[key] | ||||||
|  | 
 | ||||||
|     def head(self, n: int = 6): |     def head(self, n: int = 6): | ||||||
|         """Returns the first n items of the TimeSeries object""" |         """Returns the first n items of the TimeSeries object""" | ||||||
| 
 | 
 | ||||||
|  | |||||||
| @ -75,7 +75,7 @@ class TimeSeries(TimeSeriesCore): | |||||||
|             self.time_series = new_ts |             self.time_series = new_ts | ||||||
|             return None |             return None | ||||||
| 
 | 
 | ||||||
|         return new_ts |         return TimeSeries(new_ts, frequency=self.frequency.symbol) | ||||||
| 
 | 
 | ||||||
|     def bfill(self, inplace: bool = False, limit: int = None) -> Union[TimeSeries, None]: |     def bfill(self, inplace: bool = False, limit: int = None) -> Union[TimeSeries, None]: | ||||||
|         """Backward fill missing dates in the time series |         """Backward fill missing dates in the time series | ||||||
| @ -109,7 +109,7 @@ class TimeSeries(TimeSeriesCore): | |||||||
|             self.time_series = new_ts |             self.time_series = new_ts | ||||||
|             return None |             return None | ||||||
| 
 | 
 | ||||||
|         return new_ts |         return TimeSeries(new_ts, frequency=self.frequency.symbol) | ||||||
| 
 | 
 | ||||||
|     def calculate_returns( |     def calculate_returns( | ||||||
|         self, |         self, | ||||||
|  | |||||||
							
								
								
									
										129
									
								
								testing.ipynb
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										129
									
								
								testing.ipynb
									
									
									
									
									
										Normal file
									
								
							| @ -0,0 +1,129 @@ | |||||||
|  | { | ||||||
|  |  "cells": [ | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 14, | ||||||
|  |    "id": "3f7938c0-98e3-43b8-86e8-4f000cda7ce5", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [], | ||||||
|  |    "source": [ | ||||||
|  |     "import datetime\n", | ||||||
|  |     "import pandas as pd\n", | ||||||
|  |     "\n", | ||||||
|  |     "from fincal.fincal import TimeSeries\n", | ||||||
|  |     "from fincal.core import Series" | ||||||
|  |    ] | ||||||
|  |   }, | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 16, | ||||||
|  |    "id": "757eafc2-f804-4e7e-a3b8-2d09cd62e646", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [], | ||||||
|  |    "source": [ | ||||||
|  |     "dfd = pd.read_csv('test_files/nav_history_daily - copy.csv')" | ||||||
|  |    ] | ||||||
|  |   }, | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 17, | ||||||
|  |    "id": "59b3d4a9-8ef4-4652-9e20-1bac69ab4ff9", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [], | ||||||
|  |    "source": [ | ||||||
|  |     "dfd = dfd[dfd['amfi_code'] == 118825].reset_index(drop=True)" | ||||||
|  |    ] | ||||||
|  |   }, | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 19, | ||||||
|  |    "id": "4bc95ae0-8c33-4eab-acf9-e765d22979b8", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [ | ||||||
|  |     { | ||||||
|  |      "name": "stdout", | ||||||
|  |      "output_type": "stream", | ||||||
|  |      "text": [ | ||||||
|  |       "Warning: The input data contains duplicate dates which have been ignored.\n" | ||||||
|  |      ] | ||||||
|  |     } | ||||||
|  |    ], | ||||||
|  |    "source": [ | ||||||
|  |     "ts = TimeSeries([(i.date, i.nav) for i in dfd.itertuples()], frequency='D')" | ||||||
|  |    ] | ||||||
|  |   }, | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 20, | ||||||
|  |    "id": "f2c3218c-3984-43d6-8638-41a74a9d0b58", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [ | ||||||
|  |     { | ||||||
|  |      "data": { | ||||||
|  |       "text/plain": [ | ||||||
|  |        "TimeSeries([(datetime.datetime(2013, 1, 2, 0, 0), 18.972),\n", | ||||||
|  |        "\t    (datetime.datetime(2013, 1, 3, 0, 0), 19.011),\n", | ||||||
|  |        "\t    (datetime.datetime(2013, 1, 4, 0, 0), 19.008)\n", | ||||||
|  |        "\t    ...\n", | ||||||
|  |        "\t    (datetime.datetime(2022, 2, 10, 0, 0), 86.5),\n", | ||||||
|  |        "\t    (datetime.datetime(2022, 2, 11, 0, 0), 85.226),\n", | ||||||
|  |        "\t    (datetime.datetime(2022, 2, 14, 0, 0), 82.53299999999999)], frequency='D')" | ||||||
|  |       ] | ||||||
|  |      }, | ||||||
|  |      "execution_count": 20, | ||||||
|  |      "metadata": {}, | ||||||
|  |      "output_type": "execute_result" | ||||||
|  |     } | ||||||
|  |    ], | ||||||
|  |    "source": [ | ||||||
|  |     "ts" | ||||||
|  |    ] | ||||||
|  |   }, | ||||||
|  |   { | ||||||
|  |    "cell_type": "code", | ||||||
|  |    "execution_count": 22, | ||||||
|  |    "id": "dc469722-c816-4b57-8d91-7a3b865f86be", | ||||||
|  |    "metadata": {}, | ||||||
|  |    "outputs": [ | ||||||
|  |     { | ||||||
|  |      "ename": "TypeError", | ||||||
|  |      "evalue": "getattr(): attribute name must be string", | ||||||
|  |      "output_type": "error", | ||||||
|  |      "traceback": [ | ||||||
|  |       "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", | ||||||
|  |       "\u001b[1;31mTypeError\u001b[0m                                 Traceback (most recent call last)", | ||||||
|  |       "File \u001b[1;32m<timed eval>:1\u001b[0m, in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n", | ||||||
|  |       "File \u001b[1;32mD:\\Documents\\Projects\\fincal\\fincal\\fincal.py:203\u001b[0m, in \u001b[0;36mTimeSeries.calculate_rolling_returns\u001b[1;34m(self, from_date, to_date, frequency, as_on_match, prior_match, closest, compounding, years)\u001b[0m\n\u001b[0;32m    200\u001b[0m \u001b[38;5;28;01mexcept\u001b[39;00m \u001b[38;5;167;01mAttributeError\u001b[39;00m:\n\u001b[0;32m    201\u001b[0m     \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mInvalid argument for frequency \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mfrequency\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m--> 203\u001b[0m dates \u001b[38;5;241m=\u001b[39m \u001b[43mcreate_date_series\u001b[49m\u001b[43m(\u001b[49m\u001b[43mfrom_date\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mto_date\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mfrequency\u001b[49m\u001b[43m)\u001b[49m\n\u001b[0;32m    204\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m frequency \u001b[38;5;241m==\u001b[39m AllFrequencies\u001b[38;5;241m.\u001b[39mD:\n\u001b[0;32m    205\u001b[0m     dates \u001b[38;5;241m=\u001b[39m [i \u001b[38;5;28;01mfor\u001b[39;00m i \u001b[38;5;129;01min\u001b[39;00m dates \u001b[38;5;28;01mif\u001b[39;00m i \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mtime_series]\n", | ||||||
|  |       "File \u001b[1;32mD:\\Documents\\Projects\\fincal\\fincal\\fincal.py:16\u001b[0m, in \u001b[0;36mcreate_date_series\u001b[1;34m(start_date, end_date, frequency, eomonth)\u001b[0m\n\u001b[0;32m     11\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mcreate_date_series\u001b[39m(\n\u001b[0;32m     12\u001b[0m     start_date: datetime\u001b[38;5;241m.\u001b[39mdatetime, end_date: datetime\u001b[38;5;241m.\u001b[39mdatetime, frequency: \u001b[38;5;28mstr\u001b[39m, eomonth: \u001b[38;5;28mbool\u001b[39m \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[0;32m     13\u001b[0m ) \u001b[38;5;241m-\u001b[39m\u001b[38;5;241m>\u001b[39m List[datetime\u001b[38;5;241m.\u001b[39mdatetime]:\n\u001b[0;32m     14\u001b[0m     \u001b[38;5;124;03m\"\"\"Creates a date series using a frequency\"\"\"\u001b[39;00m\n\u001b[1;32m---> 16\u001b[0m     frequency \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mgetattr\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43mAllFrequencies\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mfrequency\u001b[49m\u001b[43m)\u001b[49m\n\u001b[0;32m     17\u001b[0m     \u001b[38;5;28;01mif\u001b[39;00m eomonth \u001b[38;5;129;01mand\u001b[39;00m frequency\u001b[38;5;241m.\u001b[39mdays \u001b[38;5;241m<\u001b[39m AllFrequencies\u001b[38;5;241m.\u001b[39mM\u001b[38;5;241m.\u001b[39mdays:\n\u001b[0;32m     18\u001b[0m         \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124meomonth cannot be set to True if frequency is higher than \u001b[39m\u001b[38;5;132;01m{\u001b[39;00mAllFrequencies\u001b[38;5;241m.\u001b[39mM\u001b[38;5;241m.\u001b[39mname\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m)\n", | ||||||
|  |       "\u001b[1;31mTypeError\u001b[0m: getattr(): attribute name must be string" | ||||||
|  |      ] | ||||||
|  |     } | ||||||
|  |    ], | ||||||
|  |    "source": [ | ||||||
|  |     "%%time\n", | ||||||
|  |     "ts.calculate_rolling_returns(from_date='2020-01-01', to_date='2021-01-01')" | ||||||
|  |    ] | ||||||
|  |   } | ||||||
|  |  ], | ||||||
|  |  "metadata": { | ||||||
|  |   "kernelspec": { | ||||||
|  |    "display_name": "Python 3 (ipykernel)", | ||||||
|  |    "language": "python", | ||||||
|  |    "name": "python3" | ||||||
|  |   }, | ||||||
|  |   "language_info": { | ||||||
|  |    "codemirror_mode": { | ||||||
|  |     "name": "ipython", | ||||||
|  |     "version": 3 | ||||||
|  |    }, | ||||||
|  |    "file_extension": ".py", | ||||||
|  |    "mimetype": "text/x-python", | ||||||
|  |    "name": "python", | ||||||
|  |    "nbconvert_exporter": "python", | ||||||
|  |    "pygments_lexer": "ipython3", | ||||||
|  |    "version": "3.8.3" | ||||||
|  |   } | ||||||
|  |  }, | ||||||
|  |  "nbformat": 4, | ||||||
|  |  "nbformat_minor": 5 | ||||||
|  | } | ||||||
		Loading…
	
		Reference in New Issue
	
	Block a user