add historical pe ratio to industry

MuslemRahimi 2024-09-17 21:12:05 +02:00
parent 006fe42073
commit 232d167733
3 changed files with 68 additions and 21 deletions

View File

@@ -5,6 +5,7 @@ import asyncio
 import pandas as pd
 from tqdm import tqdm
 import orjson
+from datetime import datetime, timedelta
 from GetStartEndDate import GetStartEndDate
 from collections import defaultdict
 import re
@@ -16,17 +17,6 @@ api_key = os.getenv('FMP_API_KEY')
 with open(f"json/stock-screener/data.json", 'rb') as file:
     stock_screener_data = orjson.loads(file.read())

-# Convert stock_screener_data into a dictionary keyed by symbol
-stock_screener_data_dict = {item['symbol']: item for item in stock_screener_data}
-
-date, _ = GetStartEndDate().run()
-date = date.strftime('%Y-%m-%d')
-
-def save_as_json(data, filename):
-    with open(f"json/industry/{filename}.json", 'w') as file:
-        ujson.dump(data, file)
-
 def format_filename(industry_name):
     # Replace spaces with hyphens
     formatted_name = industry_name.replace(' ', '-')
@@ -38,8 +28,46 @@ def format_filename(industry_name):
     return formatted_name.lower()

+date, _ = GetStartEndDate().run()
+date = date.strftime('%Y-%m-%d')
+
+def save_as_json(data, filename):
+    with open(f"json/industry/{filename}.json", 'w') as file:
+        ujson.dump(data, file)
+
+def remove_duplicates(data, key):
+    seen = set()
+    new_data = []
+    for item in data:
+        if item[key] not in seen:
+            seen.add(item[key])
+            new_data.append(item)
+    return new_data
+
+async def historical_pe_ratio(session, class_type='sector'):
+    # List to store the data
+    historical_data = []
+    # Starting point: today minus 180 days
+    end_date = datetime.now()
+    start_date = end_date - timedelta(days=180)
+    # Iterate through each day
+    current_date = start_date
+    while current_date <= end_date:
+        if current_date.weekday() < 5:  # Only fetch data for weekdays (Monday to Friday)
+            date_str = current_date.strftime('%Y-%m-%d')
+            data = await get_data(session, date_str, class_type)
+            if data:
+                historical_data += data
+        # Move to the next day
+        current_date += timedelta(days=1)
+    return historical_data
+
 # Function to fetch data from the API
-async def get_data(session, class_type='sector'):
+async def get_data(session, date, class_type='sector'):
     if class_type == 'sector':
         url = f"https://financialmodelingprep.com/api/v4/sector_price_earning_ratio?date={date}&exchange=NYSE&apikey={api_key}"
     else:
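
Note: the new historical_pe_ratio issues one request per weekday in the trailing 180-day window, which is possible because get_data now takes the snapshot date as an explicit parameter instead of reading a module-level variable. A minimal sketch of that date walk with the network call stubbed out (trailing_weekdays is a hypothetical helper, not part of this commit):

    from datetime import datetime, timedelta

    def trailing_weekdays(days: int = 180):
        # Yield 'YYYY-MM-DD' strings for every Mon-Fri in the trailing window.
        end_date = datetime.now()
        current = end_date - timedelta(days=days)
        while current <= end_date:
            if current.weekday() < 5:  # Monday=0 ... Friday=4
                yield current.strftime('%Y-%m-%d')
            current += timedelta(days=1)

    # Roughly 130 dates for a 180-day window, i.e. ~130 API calls per run.
    print(len(list(trailing_weekdays())))
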
@@ -69,11 +97,30 @@ def get_each_industry_data():

 async def run():
+    async with aiohttp.ClientSession() as session:
+        historical_pe_list = await historical_pe_ratio(session, class_type = 'industry')
+
     full_industry_list = get_each_industry_data()
     for industry, stocks in full_industry_list.items():
         filename = 'industries/'+format_filename(industry)
         stocks = sorted(stocks, key= lambda x: x['marketCap'], reverse=True)
-        save_as_json(stocks, filename)
+        history_list = []
+        for item in historical_pe_list:
+            try:
+                if item['industry'] == industry:
+                    history_list.append({'date': item['date'], 'pe': round(float(item['pe']),2)})
+            except:
+                pass
+        history_list = sorted(history_list, key=lambda x: datetime.strptime(x['date'], '%Y-%m-%d'), reverse=False)
+        history_list = remove_duplicates(history_list, 'date')
+
+        res = {'name': industry, 'stocks': stocks, 'history': history_list}
+        save_as_json(res, filename)

 # Initialize a dictionary to store stock count, market cap, and other totals for each industry
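
Note: per industry, run() now filters the pooled historical rows, sorts them ascending by date, and drops duplicate dates; since remove_duplicates keeps the first occurrence, the earliest-seen row for each date wins after the sort. A worked example with made-up values:

    from datetime import datetime

    def remove_duplicates(data, key):  # copied from this diff for self-containment
        seen, out = set(), []
        for item in data:
            if item[key] not in seen:
                seen.add(item[key])
                out.append(item)
        return out

    sample = [
        {'date': '2024-09-16', 'industry': 'Biotechnology', 'pe': '21.4567'},
        {'date': '2024-09-13', 'industry': 'Biotechnology', 'pe': '20.9912'},
        {'date': '2024-09-16', 'industry': 'Biotechnology', 'pe': '21.4567'},  # duplicate date
    ]
    history_list = [{'date': i['date'], 'pe': round(float(i['pe']), 2)}
                    for i in sample if i['industry'] == 'Biotechnology']
    history_list.sort(key=lambda x: datetime.strptime(x['date'], '%Y-%m-%d'))
    history_list = remove_duplicates(history_list, 'date')
    # -> [{'date': '2024-09-13', 'pe': 20.99}, {'date': '2024-09-16', 'pe': 21.46}]

One caveat: the bare except around the append silently drops rows whose 'pe' field is missing or non-numeric; narrowing it to except (KeyError, TypeError, ValueError) would make such failures visible.
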
@@ -150,7 +197,7 @@ async def run():
     # Assign the P/E values from pe_industry to the overview
     async with aiohttp.ClientSession() as session:
-        pe_industry = await get_data(session, class_type='industry')
+        pe_industry = await get_data(session, date, class_type='industry')

     for sector, industries in overview.items():
         for industry_data in industries:
             industry_name = industry_data['industry']
@@ -216,7 +263,7 @@ async def run():
     # Assign the P/E values from pe_industry to the overview
     async with aiohttp.ClientSession() as session:
-        pe_sector = await get_data(session, class_type='sector')
+        pe_sector = await get_data(session, date, class_type='sector')

     # Loop through sector_overview to update P/E ratios from pe_sector
     for sector_data in sector_overview:
         sector_name = sector_data['sector']
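
Note: these two hunks are the same mechanical change. get_data previously read the module-level date implicitly; passing it explicitly lets one function serve both today's snapshot and the historical backfill. A sketch of the request it builds (placeholder date; the real script derives it from GetStartEndDate):

    import os

    api_key = os.getenv('FMP_API_KEY')
    date = '2024-09-17'  # placeholder snapshot date
    url = (
        "https://financialmodelingprep.com/api/v4/sector_price_earning_ratio"
        f"?date={date}&exchange=NYSE&apikey={api_key}"
    )
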

View File

@@ -3679,7 +3679,7 @@ async def get_sector_overview(data: TickerData, api_key: str = Security(get_api_
         with open(f"json/industry/industries/{ticker}.json", 'rb') as file:
             res = orjson.loads(file.read())
     except:
-        res = []
+        res = {}
     data = orjson.dumps(res)
     compressed_data = gzip.compress(data)
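
Note: the fallback changes from a list to a dict because the per-industry JSON written by the cron job is now an object with 'name', 'stocks', and 'history' keys, so the error path should return the same shape. A hypothetical condensation of the endpoint's read path (load_industry_payload is not the real handler name):

    import gzip
    import orjson

    def load_industry_payload(ticker: str) -> bytes:
        try:
            with open(f"json/industry/industries/{ticker}.json", 'rb') as file:
                res = orjson.loads(file.read())
        except (FileNotFoundError, orjson.JSONDecodeError):
            res = {}  # same shape as {'name': ..., 'stocks': ..., 'history': ...}
        return gzip.compress(orjson.dumps(res))
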

View File

@@ -628,7 +628,7 @@ schedule.every(5).minutes.do(run_threaded, run_cron_market_movers).tag('market_m
 schedule.every(30).minutes.do(run_threaded, run_dividend_list).tag('dividend_list_job')
 schedule.every(15).minutes.do(run_threaded, run_cron_market_news).tag('market_news_job')
-schedule.every(15).minutes.do(run_threaded, run_cron_industry).tag('industry_job')
+schedule.every(30).minutes.do(run_threaded, run_cron_industry).tag('industry_job')
 schedule.every(10).minutes.do(run_threaded, run_one_day_price).tag('one_day_price_job')
 schedule.every(15).minutes.do(run_threaded, run_cron_heatmap).tag('heatmap_job')
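
Note: the industry job's cadence drops from every 15 minutes to every 30, presumably to absorb the ~130 extra API calls per run added by the historical backfill. For reference, the scheduling pattern in isolation (stub job; the real script wraps jobs in run_threaded so they don't block the scheduler loop):

    import time
    import schedule

    def run_cron_industry():
        print("rebuild industry JSON")  # stub for the real job

    schedule.every(30).minutes.do(run_cron_industry).tag('industry_job')

    while True:
        schedule.run_pending()
        time.sleep(1)
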