Spaces:

lamonkey
/

portfolio_management

Sleeping

App Files Files Community

portfolio_management / api.py

huggingface112

imp left_fill, right_fill and update log

2b059b0 about 1 year ago

raw

history blame contribute delete

No virus

10.5 kB


	'''
	contain method for api call to jqdatasdk
	'''
	from dotenv import load_dotenv
	from datetime import datetime, timedelta
	import jqdatasdk as jq
	import pandas as pd
	from typing import List, Optional
	from sqlalchemy import create_engine
	import table_schema as ts
	import os
	import utils

	db_url = 'sqlite:///instance/local.db'
	load_dotenv()
	user_name = os.environ.get('JQDATA_USER')
	password = os.environ.get('JQDATA_PASSWORD')


	def auth_api(func):
	"""
	decorator for function require jqdatasdk api
	"""
	def wrapper(args, *kwargs):

	if (not jq.is_auth()):
	jq.auth(user_name, password)

	result = func(args, *kwargs)
	return result

	return wrapper


	def aggregate_sector(input: str) -> Optional[str]:
	'''
	mapping from sector to aggregated sector retur None if not found
	this handling is for spotting undefined sector in current mapping
	later

	Return: str -- aggregated sector
	None if no mapping
	'''
	mapping = {
	'电气设备I': '工业',
	'建筑装饰I': '工业',
	'交通运输I': '工业',
	'机械设备I': '工业',
	'国防军工I': '工业',
	'综合I': '工业',
	'电子I': '信息与通信',
	'计算机I': '信息与通信',
	'通信I': '信息与通信',
	'传媒I': '信息与通信',
	'纺织服装I': '消费',
	'家用电器I': '消费',
	'汽车I': '消费',
	'休闲服务I': '消费',
	'商业贸易I': '消费',
	'食品饮料I': '消费',
	'美容护理I': '消费',
	'农林牧渔I': '消费',
	'钢铁I': '原料与能源',
	'建筑材料I': '原料与能源',
	'有色金属I': '原料与能源',
	'化工I': '原料与能源',
	'轻工制造I': '原料与能源',
	'煤炭I': '原料与能源',
	'石油石化I': '原料与能源',
	'采掘I': '原料与能源',
	'医药生物I': '医药卫生',
	'公用事业I': '公用事业',
	'环保I': '公用事业',
	'房地产I': '金融与地产',
	'银行I': '金融与地产',
	'非银金融I': '金融与地产'
	}
	# return the first mapping found
	sectors = input.split(" ")
	maped_name = "其他"
	for sector in sectors:
	maped_name = mapping.get(sector, None)
	if maped_name is not None:
	return maped_name

	return maped_name


	@auth_api
	def get_all_stock_info() -> tuple[pd.DataFrame, List[str]]:
	'''
	return all stock information

	Return
	------
	tuple: tuple(pd.DataFrame, List[str])
	DataFrame -- display_name \| name \| start_date \| end_date \| type
	'''
	error = []
	try:
	df = jq.get_all_securities()
	df['ticker'] = df.index
	df.reset_index(drop=True, inplace=True)
	# df.reset_index(inplace=True)
	return df, error
	except Exception as e:
	error.append(f'get_all_stock_info\n{e}')
	return None, error


	@auth_api
	def add_detail_to_stocks(df: pd.DataFrame) -> List[str]:
	"""
	add display_name, name, sector, and aggregate sector to each stock if not exist already
	return a list of error message

	Args: pd.DataFrame
	ticker \| date \| weight \| sector \| aggregate_sector \| display_name \| name

	Returns: List[str], error messages
	"""
	error = []
	df[['sector', 'aggregate_sector']] = df.groupby(
	'ticker')[['sector', 'aggregate_sector']].ffill()
	df[['display_name', 'name']] = df.groupby(
	'ticker')[['display_name', 'name']].ffill()
	not_have_sector = list(
	df[df['aggregate_sector'].isnull()]['ticker'].unique())
	not_have_name = list(df[df['name'].isnull()]['ticker'].unique())
	# sector and aggregate sector
	if len(not_have_sector) != 0:
	try:
	sectors = jq.get_industry(security=not_have_sector)
	df['sector'] = df.apply(lambda x: x.sector if not pd.isna(x.sector)
	else " ".join(value['industry_name']
	for value in sectors[x.ticker].values()), axis=1)
	df['aggregate_sector'] = df.apply(
	lambda x: x.aggregate_sector if not pd.isna(x.aggregate_sector)
	else aggregate_sector(x.sector), axis=1
	)
	except Exception as e:
	error.append(f'Error on creaet_sector_information\n{ticker}\n{e}')

	# display_name and name
	if len(not_have_name) != 0:
	try:
	for ticker in not_have_name:
	detail = jq.get_security_info(ticker)
	df.loc[df.ticker.isin(not_have_name)
	]['display_name'] = detail.display_name
	df.loc[df.ticker.isin(not_have_name)]['name'] = detail.name
	except Exception as e:
	error.append(f'Error on get display_name and name\n{ticker}\n{e}')

	return error


	@auth_api
	def update_portfolio_profile(stocks: List[dict], current_p: pd.DataFrame = None) -> tuple[pd.DataFrame, List[str]]:
	"""create or update a portfolio profile,
	return a time series of profile

	Parameters
	----------
	stocks : List[{ticker: Str, shares: float, date:datetime}]

	update profile with a list of stock information

	current_p : pd.DataFrame, optional
	current portfolio profile, default is None

	Returns
	-------
	updated_profile : pd.DataFrame
	ticker \| date \| weight \| sector \| aggregate_sector \| display_name \| name

	error : List[str]
	a list of error message
	"""

	error = []
	profile_df = pd.DataFrame(stocks)
	profile_df['sector'] = None
	profile_df['aggregate_sector'] = None

	# add display_name
	try:
	with create_engine(db_url).connect() as conn:
	info_df = pd.read_sql_table(ts.STOCKS_DETAILS_TABLE, conn)
	profile_df = pd.merge(
	profile_df, info_df[['display_name', 'ticker', 'name', 'aggregate_sector', ]], on='ticker', how='left')
	except Exception as e:
	error.append(f'create_portfolio \n{e}')

	# get sector information
	incoming_error = add_detail_to_stocks(profile_df)
	error.extend(incoming_error)

	# concate to existing profile if exist
	if current_p is not None:
	profile_df = pd.concat([profile_df, current_p], ignore_index=True)
	profile_df.drop_duplicates(
	subset=['ticker', 'date'], keep='last', inplace=True)
	profile_df.reset_index(drop=True, inplace=True)

	return profile_df, error


	@auth_api
	def get_all_stocks_detail():
	'''get df contain all stock display_name, name, sector, aggregate_sector'''
	detail_df = jq.get_all_securities()
	detail_df['ticker'] = detail_df.index
	detail_df.reset_index(drop=True, inplace=True)
	industry_info = jq.get_industry(detail_df.ticker.to_list())
	detail_df['sector'] = detail_df.apply(lambda x: " ".join(
	value['industry_name']for value in industry_info[x.ticker].values()), axis=1)
	detail_df['aggregate_sector'] = detail_df.apply(
	lambda x: aggregate_sector(x.sector), axis=1)
	return detail_df


	@auth_api
	def get_api_usage():
	return jq.get_query_count()


	@auth_api
	def get_stocks_price(profile: pd.DataFrame, start_date: datetime, end_date: datetime, frequency='daily') -> tuple[pd.DataFrame, List[str]]:
	"""
	Return a dataframe contain stock price between period of time for price in a portfolio profile

	Arguments:
	profile {pd.DataFrame} -- ticker \| date \| weight \| sector \| aggregate_sector \| display_name \| name
	start_date {datetime} -- start date of the period include start date
	end_date {datetime} -- end date of the period include end date
	frequency {str} -- resolution of the price, default is daily

	Returns: Tuple(pd.DataFrame, List[str])
	pd.DataFrame -- ticker date open close high low volumn money
	error_message {list} -- a list of error message
	"""
	error_message = []
	start_str = start_date.strftime('%Y-%m-%d')
	end_str = end_date.strftime('%Y-%m-%d')
	if profile.date.min() < start_date:
	# hanlde benchmark doesn't have weight on the exact date
	start_str = profile.date.min().strftime('%Y-%m-%d')

	ticker = profile['ticker'].to_list()
	try:

	data = jq.get_price(ticker, start_date=start_str,
	end_date=end_str, frequency=frequency)
	data.rename(columns={'time': 'date', 'code': "ticker"}, inplace=True)
	return data, error_message
	except Exception as e:
	error_message.append(f'Error when fetching {ticker} \n {e}')
	return None, error_message


	@auth_api
	def fetch_stocks_price(**params):
	'''request list of stock price from start_date to end_date with frequency or count'''
	stocks_df = jq.get_price(**params)
	stocks_df.rename(columns={'code': 'ticker'}, inplace=True)
	return stocks_df

	@auth_api
	def fetch_benchmark_profile(start_date: datetime, end_date: datetime, delta_time=timedelta(days=30), benchmark="000905.XSHG"):
	'''
	fetch benchmark profile from start_date to end_date with delta_time

	Parameters
	----------
	start_date : datetime
	start date of the period include start date
	end_date : datetime
	end date of the period include end date
	delta_time : timedelta, optional
	the default is 30 days since the jq api only update index weight once every month
	'''
	if end_date < start_date:
	raise Exception('end_date must be greater than start_date')

	results = []
	# handle end_date == start_date
	while start_date < end_date:
	try:
	date_str = start_date.strftime('%Y-%m-%d')
	result = jq.get_index_weights(benchmark, date=date_str)
	results.append(result)
	except Exception as e:
	print(f'Error when fetching {benchmark}\n\
	update on {date_str} is missing\n\
	{e}')
	start_date += delta_time
	update_df = pd.concat(results)
	update_df['ticker'] = update_df.index
	update_df['date'] = pd.to_datetime(update_df['date'])
	# update_df.rename({'date': 'time'}, inplace=True, axis=1)
	# remove duplicate row
	update_df = update_df.drop_duplicates(
	subset=['ticker', 'date'], keep='last')
	update_df.reset_index(drop=True, inplace=True)
	return update_df