"""Build/refresh a local SQLite snapshot (backup_db/stocks.db) of stock data
from the Financial Modeling Prep (FMP) API.

For every eligible ticker the script stores:
  * a row in the `stocks` table (profile, quote, statements, ratios, peers,
    ownership, segmentation, estimates — columns are added on the fly), and
  * a per-symbol OHLC table with daily price history since 2015-01-01.

Run as a script. Requires the FMP_API_KEY environment variable (a local .env
file is honoured via python-dotenv).
"""

import asyncio
import json
import os
import sqlite3
import warnings
from datetime import datetime

import aiohttp
import ujson
import pandas as pd  # noqa: F401  (kept: file-level import, may be used downstream)
from dotenv import load_dotenv
from tqdm import tqdm
from ta.utils import *       # noqa: F401,F403
from ta.volatility import *  # noqa: F401,F403
from ta.momentum import *    # noqa: F401,F403
from ta.trend import *       # noqa: F401,F403
from ta.volume import *      # noqa: F401,F403

load_dotenv()
api_key = os.getenv('FMP_API_KEY')

# Filter out the specific RuntimeWarning (raised by indicator math on
# degenerate series) so it does not flood the progress output.
warnings.filterwarnings(
    "ignore",
    category=RuntimeWarning,
    message="invalid value encountered in scalar divide",
)

# Price-history window and the quarter used for institutional ownership.
start_date = datetime(2015, 1, 1).strftime("%Y-%m-%d")
end_date = datetime.today().strftime("%Y-%m-%d")
quarter_date = '2024-6-30'


def get_jsonparsed_data(data):
    """Parse *data* (a JSON string) and return the result.

    Returns an empty dict on malformed payloads so callers can treat API
    hiccups as "no data" instead of crashing.
    """
    try:
        return json.loads(data)
    except json.JSONDecodeError:
        return {}


class StockDatabase:
    """Wrapper around a SQLite database holding one `stocks` summary table
    plus one OHLC history table per ticker symbol."""

    def __init__(self, db_path):
        self.db_path = db_path
        self.conn = sqlite3.connect(db_path)
        self.cursor = self.conn.cursor()
        # WAL mode allows concurrent readers while we bulk-insert.
        self.cursor.execute("PRAGMA journal_mode = wal")
        self.conn.commit()
        self._create_table()

    def close_connection(self):
        """Close the cursor and the underlying connection."""
        self.cursor.close()
        self.conn.close()

    def _create_table(self):
        """Create the base `stocks` table; further columns are added lazily
        by save_fundamental_data as data arrives."""
        self.cursor.execute("""
        CREATE TABLE IF NOT EXISTS stocks (
            symbol TEXT PRIMARY KEY,
            name TEXT,
            exchange TEXT,
            exchangeShortName TEXT,
            type TEXT
        )
        """)

    def get_column_type(self, value):
        """Map a Python value to the SQLite column type used when a column is
        created on the fly. Unknown types (including None) default to TEXT."""
        if isinstance(value, str):
            return "TEXT"
        # NOTE: bool is a subclass of int and is stored as INTEGER.
        if isinstance(value, int):
            return "INTEGER"
        if isinstance(value, float):
            return "REAL"
        return "TEXT"

    def remove_null(self, value):
        """Replace a missing value with a storable placeholder.

        BUGFIX: the original tested `isinstance(value, str) and value == None`
        (and the int/float equivalents), which can never be true — None is not
        an instance of str/int/float — so NULLs always leaked through. A plain
        None check is what was intended; 'n/a' matches get_column_type(None)
        which types unknown values as TEXT.
        """
        if value is None:
            return 'n/a'
        return value

    async def save_fundamental_data(self, session, symbol):
        """Fetch every fundamental endpoint for *symbol* and write the
        results into dynamically-created columns of the `stocks` table.

        Large statement blobs already present for the symbol are skipped to
        save API credits. Any failure is printed and swallowed so one bad
        symbol does not abort the whole run.
        """
        try:
            urls = [
                f"https://financialmodelingprep.com/api/v3/profile/{symbol}?apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/quote/{symbol}?apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/income-statement/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/income-statement-growth/{symbol}?period=annual&apikey={api_key}",
                # f"https://financialmodelingprep.com/api/v4/esg-environmental-social-governance-data-ratings?symbol={symbol}&apikey={api_key}",
                # f"https://financialmodelingprep.com/api/v4/esg-environmental-social-governance-data?symbol={symbol}&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/historical-price-full/stock_dividend/{symbol}?limit=400&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/historical/employee_count?symbol={symbol}&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/balance-sheet-statement/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/balance-sheet-statement-growth/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/cash-flow-statement/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/cash-flow-statement-growth/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/ratios/{symbol}?period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/historical-price-full/stock_split/{symbol}?apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/stock_peers?symbol={symbol}&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/institutional-ownership/institutional-holders/symbol-ownership-percent?date={quarter_date}&symbol={symbol}&page=0&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/historical/shares_float?symbol={symbol}&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/revenue-product-segmentation?symbol={symbol}&structure=flat&period=annual&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v4/revenue-geographic-segmentation?symbol={symbol}&structure=flat&apikey={api_key}",
                f"https://financialmodelingprep.com/api/v3/analyst-estimates/{symbol}?apikey={api_key}",
            ]

            fundamental_data = {}

            # Determine which bulky statement blobs already exist so the
            # corresponding API calls can be skipped.
            try:
                self.cursor.execute(
                    "SELECT income, income_growth, balance, balance_growth, "
                    "cashflow, cashflow_growth, ratios, stock_peers "
                    "FROM stocks WHERE symbol = ?",
                    (symbol,),
                )
                existing_data = self.cursor.fetchone()
                # BUGFIX: the original read indices 0/1 for every flag
                # (copy-paste), so e.g. balance_exists actually tested the
                # income column. Each flag now checks its own column.
                income_exists = bool(existing_data and existing_data[0] is not None)
                income_growth_exists = bool(existing_data and existing_data[1] is not None)
                balance_exists = bool(existing_data and existing_data[2] is not None)
                balance_growth_exists = bool(existing_data and existing_data[3] is not None)
                cashflow_exists = bool(existing_data and existing_data[4] is not None)
                cashflow_growth_exists = bool(existing_data and existing_data[5] is not None)
                ratios_exists = bool(existing_data and existing_data[6] is not None)
                stock_peers_exists = bool(existing_data and existing_data[7] is not None)
            except sqlite3.OperationalError:
                # Columns are created lazily; on a fresh table none exist yet.
                income_exists = income_growth_exists = False
                balance_exists = balance_growth_exists = False
                cashflow_exists = cashflow_growth_exists = False
                ratios_exists = stock_peers_exists = False

            for url in urls:
                # Skip the API calls whose data already exists.
                if 'income-statement/' in url and income_exists:
                    print(f"Skipping income-statement for {symbol} as it already exists.")
                    continue
                elif 'income-statement-growth/' in url and income_growth_exists:
                    print(f"Skipping income-statement-growth for {symbol} as it already exists.")
                    continue
                elif 'balance-sheet-statement/' in url and balance_exists:
                    print(f"Skipping balance-statement for {symbol} as it already exists.")
                    continue
                elif 'balance-sheet-statement-growth/' in url and balance_growth_exists:
                    print(f"Skipping balance-statement-growth for {symbol} as it already exists.")
                    continue
                elif 'cash-flow-statement/' in url and cashflow_exists:
                    print(f"Skipping cashflow-statement for {symbol} as it already exists.")
                    continue
                elif 'cash-flow-statement-growth/' in url and cashflow_growth_exists:
                    print(f"Skipping cashflow-statement-growth for {symbol} as it already exists.")
                    continue
                elif '/v3/ratios/' in url and ratios_exists:
                    print(f"Skipping ratios for {symbol} as it already exists.")
                    continue
                # BUGFIX: the original tested 'stock_peers/' which never
                # matches the actual URL (…/stock_peers?symbol=…), so peers
                # were always re-downloaded.
                elif 'stock_peers?' in url and stock_peers_exists:
                    print(f"Skipping stock_peers for {symbol} as it already exists.")
                    continue

                async with session.get(url) as response:
                    data = await response.text()

                parsed_data = get_jsonparsed_data(data)
                # Best-effort extraction: a missing key or empty list simply
                # leaves those columns unset for this symbol.
                try:
                    if isinstance(parsed_data, list) and "profile" in url:
                        fundamental_data['profile'] = ujson.dumps(parsed_data)
                        fundamental_data.update({
                            'beta': parsed_data[0]['beta'],
                            'country': parsed_data[0]['country'],
                            'sector': parsed_data[0]['sector'],
                            'industry': parsed_data[0]['industry'],
                            'discounted_cash_flow': round(parsed_data[0]['dcf'], 2),
                        })
                    elif isinstance(parsed_data, list) and "quote" in url:
                        fundamental_data['quote'] = ujson.dumps(parsed_data)
                        fundamental_data.update({
                            'price': parsed_data[0]['price'],
                            'changesPercentage': round(parsed_data[0]['changesPercentage'], 2),
                            'marketCap': parsed_data[0]['marketCap'],
                            'volume': parsed_data[0]['volume'],
                            'avgVolume': parsed_data[0]['avgVolume'],
                            'eps': parsed_data[0]['eps'],
                            'pe': parsed_data[0]['pe'],
                        })
                    elif isinstance(parsed_data, list) and "income-statement/" in url:
                        fundamental_data['income'] = ujson.dumps(parsed_data)
                        fundamental_data.update({
                            'revenue': parsed_data[0]['revenue'],
                            'netIncome': parsed_data[0]['netIncome'],
                            'grossProfit': parsed_data[0]['grossProfit'],
                            'costOfRevenue': parsed_data[0]['costOfRevenue'],
                            'costAndExpenses': parsed_data[0]['costAndExpenses'],
                            'interestIncome': parsed_data[0]['interestIncome'],
                            'interestExpense': parsed_data[0]['interestExpense'],
                            'researchAndDevelopmentExpenses': parsed_data[0]['researchAndDevelopmentExpenses'],
                            'ebitda': parsed_data[0]['ebitda'],
                            'ebitdaratio': parsed_data[0]['ebitdaratio'],
                            'depreciationAndAmortization': parsed_data[0]['depreciationAndAmortization'],
                            'operatingIncome': parsed_data[0]['operatingIncome'],
                            'operatingExpenses': parsed_data[0]['operatingExpenses'],
                        })
                    elif isinstance(parsed_data, list) and "/v3/ratios/" in url:
                        fundamental_data['ratios'] = ujson.dumps(parsed_data)
                        fundamental_data.update({
                            'payoutRatio': parsed_data[0]['payoutRatio'],
                            'priceToBookRatio': parsed_data[0]['priceToBookRatio'],
                            'dividendPayoutRatio': parsed_data[0]['dividendPayoutRatio'],
                            'priceToSalesRatio': parsed_data[0]['priceToSalesRatio'],
                            'priceEarningsRatio': parsed_data[0]['priceEarningsRatio'],
                            'priceCashFlowRatio': parsed_data[0]['priceCashFlowRatio'],
                            'priceSalesRatio': parsed_data[0]['priceSalesRatio'],
                            'dividendYield': parsed_data[0]['dividendYield'],
                            'cashFlowToDebtRatio': parsed_data[0]['cashFlowToDebtRatio'],
                            'freeCashFlowPerShare': parsed_data[0]['freeCashFlowPerShare'],
                            'cashPerShare': parsed_data[0]['cashPerShare'],
                        })
                    elif isinstance(parsed_data, list) and "balance-sheet-statement/" in url:
                        fundamental_data['balance'] = ujson.dumps(parsed_data)
                    elif isinstance(parsed_data, list) and "cash-flow-statement/" in url:
                        fundamental_data['cashflow'] = ujson.dumps(parsed_data)
                    elif isinstance(parsed_data, list) and "sector-benchmark" in url:
                        # Currently unreachable (the ESG URLs above are
                        # commented out); kept for when they are re-enabled.
                        fundamental_data['esg_sector_benchmark'] = ujson.dumps(parsed_data)
                    elif isinstance(parsed_data, list) and "income-statement-growth/" in url:
                        fundamental_data['income_growth'] = ujson.dumps(parsed_data)
                        # Growth figures arrive as fractions; store percentages.
                        fundamental_data.update({
                            'growthRevenue': parsed_data[0]['growthRevenue'] * 100,
                            'growthNetIncome': parsed_data[0]['growthNetIncome'] * 100,
                            'growthGrossProfit': parsed_data[0]['growthGrossProfit'] * 100,
                            'growthCostOfRevenue': parsed_data[0]['growthCostOfRevenue'] * 100,
                            'growthCostAndExpenses': parsed_data[0]['growthCostAndExpenses'] * 100,
                            'growthInterestExpense': parsed_data[0]['growthInterestExpense'] * 100,
                            'growthResearchAndDevelopmentExpenses': parsed_data[0]['growthResearchAndDevelopmentExpenses'] * 100,
                            'growthEBITDA': parsed_data[0]['growthEBITDA'] * 100,
                            'growthEBITDARatio': parsed_data[0]['growthEBITDARatio'] * 100,
                            'growthDepreciationAndAmortization': parsed_data[0]['growthDepreciationAndAmortization'] * 100,
                            'growthEPS': parsed_data[0]['growthEPS'] * 100,
                            'growthOperatingIncome': parsed_data[0]['growthOperatingIncome'] * 100,
                            'growthOperatingExpenses': parsed_data[0]['growthOperatingExpenses'] * 100,
                        })
                    elif isinstance(parsed_data, list) and "balance-sheet-statement-growth/" in url:
                        fundamental_data['balance_growth'] = ujson.dumps(parsed_data)
                    elif isinstance(parsed_data, list) and "cash-flow-statement-growth/" in url:
                        fundamental_data['cashflow_growth'] = ujson.dumps(parsed_data)
                    elif "stock_dividend" in url:
                        fundamental_data['stock_dividend'] = ujson.dumps(parsed_data)
                    elif "employee_count" in url:
                        fundamental_data['history_employee_count'] = ujson.dumps(parsed_data)
                    elif "stock_split" in url:
                        fundamental_data['stock_split'] = ujson.dumps(parsed_data['historical'])
                    elif "stock_peers" in url:
                        fundamental_data['stock_peers'] = ujson.dumps(
                            [item for item in parsed_data[0]['peersList'] if item != ""]
                        )
                    elif "institutional-ownership/institutional-holders" in url:
                        fundamental_data['shareholders'] = ujson.dumps(parsed_data)
                    elif "historical/shares_float" in url:
                        fundamental_data['historicalShares'] = ujson.dumps(parsed_data)
                    elif "revenue-product-segmentation" in url:
                        fundamental_data['revenue_product_segmentation'] = ujson.dumps(parsed_data)
                    elif "revenue-geographic-segmentation" in url:
                        fundamental_data['revenue_geographic_segmentation'] = ujson.dumps(parsed_data)
                    elif "analyst-estimates" in url:
                        fundamental_data['analyst_estimates'] = ujson.dumps(parsed_data)
                except Exception:
                    # Deliberate best-effort: malformed/empty responses for a
                    # single endpoint are ignored.
                    pass

            # Discover which columns already exist, add any new ones, then
            # write every fetched value for this symbol.
            self.cursor.execute("PRAGMA table_info(stocks)")
            columns = {column[1]: column[2] for column in self.cursor.fetchall()}

            column_definitions = {
                key: (
                    self.get_column_type(fundamental_data.get(key)),
                    self.remove_null(fundamental_data.get(key)),
                )
                for key in fundamental_data
            }

            for column, (column_type, value) in column_definitions.items():
                # Column names come from our own hard-coded keys above, so the
                # f-string DDL is not an injection surface.
                if column not in columns and column_type:
                    self.cursor.execute(f"ALTER TABLE stocks ADD COLUMN {column} {column_type}")
                self.cursor.execute(
                    f"UPDATE stocks SET {column} = ? WHERE symbol = ?",
                    (value, symbol),
                )

            self.conn.commit()
        except Exception as e:
            print(f"Failed to fetch fundamental data for symbol {symbol}: {str(e)}")

    async def save_stocks(self, stocks):
        """Filter *stocks* to the supported exchanges, upsert them into the
        `stocks` table, then download OHLC history and fundamentals for each
        kept ticker with a simple 60-requests-then-sleep rate limit.

        PNK and EURONEXT listings are restricted to hand-picked whitelists.
        """
        pnk_whitelist = {'DRSHF', 'NTDOY', 'OTGLF', 'TCEHY', 'KRKNF', 'BYDDY', 'XIACY', 'NSRGY'}
        euronext_whitelist = {'ALEUP.PA', 'ALNEV.PA', 'ALGAU.PA', 'ALDRV.PA', 'ALHYG.PA', 'ALVMG.PA'}

        ticker_data = []
        for stock in stocks:
            exchange_short_name = stock.get('exchangeShortName', '')
            ticker_type = stock.get('type', '')
            if exchange_short_name not in ['XETRA', 'NYSE', 'NASDAQ', 'AMEX', 'PNK', 'EURONEXT'] \
                    or ticker_type not in ['stock']:
                continue
            symbol = stock.get('symbol', '')
            if exchange_short_name == 'PNK' and symbol not in pnk_whitelist:
                continue
            if exchange_short_name == 'EURONEXT' and symbol not in euronext_whitelist:
                continue
            name = stock.get('name', '')
            exchange = stock.get('exchange', '')
            if name:
                ticker_data.append((symbol, name, exchange, exchange_short_name, ticker_type))

        # Upsert all ticker rows in one transaction.
        self.cursor.execute("BEGIN TRANSACTION")
        for symbol, name, exchange, exchange_short_name, ticker_type in ticker_data:
            self.cursor.execute("SELECT symbol FROM stocks WHERE symbol = ?", (symbol,))
            if self.cursor.fetchone() is None:
                self.cursor.execute("""
                    INSERT INTO stocks (symbol, name, exchange, exchangeShortName, type)
                    VALUES (?, ?, ?, ?, ?)
                """, (symbol, name, exchange, exchange_short_name, ticker_type))
            else:
                self.cursor.execute("""
                    UPDATE stocks SET name = ?, exchange = ?, exchangeShortName = ?, type = ?
                    WHERE symbol = ?
                """, (name, exchange, exchange_short_name, ticker_type, symbol))
        self.conn.commit()

        # Fetch OHLC + fundamentals concurrently, pausing every 60 tickers to
        # stay within the API rate limit.
        async with aiohttp.ClientSession() as session:
            tasks = []
            i = 0
            for stock_data in tqdm(ticker_data):
                symbol = stock_data[0]
                tasks.append(self.save_ohlc_data(session, symbol))
                tasks.append(self.save_fundamental_data(session, symbol))
                i += 1
                if i % 60 == 0:
                    await asyncio.gather(*tasks)
                    tasks = []
                    print('sleeping mode: ', i)
                    await asyncio.sleep(60)  # Pause for 60 seconds
            if tasks:
                await asyncio.gather(*tasks)

    def _create_ticker_table(self, symbol):
        """Create the per-ticker OHLC table if it does not already exist.

        The symbol is interpolated into the DDL (SQLite cannot parameterize
        table names); symbols come from the FMP listing and are quoted so
        characters like '.' or '-' stay safe.
        """
        self.cursor.execute(f"""
        CREATE TABLE IF NOT EXISTS '{symbol}' (
            date TEXT UNIQUE,
            open FLOAT,
            high FLOAT,
            low FLOAT,
            close FLOAT,
            volume INT,
            change_percent FLOAT
        );
        """)
        self.conn.commit()

    async def save_ohlc_data(self, session, symbol):
        """Fetch daily OHLC history for *symbol* and insert any rows whose
        date is not yet stored. Failures are printed and swallowed."""
        try:
            self._create_ticker_table(symbol)  # Ensure the table exists

            url = (
                f"https://financialmodelingprep.com/api/v3/historical-price-full/{symbol}"
                f"?serietype=bar&from={start_date}&to={end_date}&apikey={api_key}"
            )
            async with session.get(url) as response:
                data = await response.text()
            ohlc_data = get_jsonparsed_data(data)

            if 'historical' in ohlc_data:
                # The API returns newest-first; store oldest-first.
                for entry in ohlc_data['historical'][::-1]:
                    date = entry.get('date')
                    # Insert only dates we have not stored yet.
                    self.cursor.execute(f"SELECT date FROM '{symbol}' WHERE date = ?", (date,))
                    if self.cursor.fetchone() is None:
                        self.cursor.execute(f"""
                            INSERT INTO '{symbol}' (date, open, high, low, close, volume, change_percent)
                            VALUES (?, ?, ?, ?, ?, ?, ?)
                        """, (
                            date,
                            entry.get('open'),
                            entry.get('high'),
                            entry.get('low'),
                            entry.get('close'),
                            entry.get('volume'),
                            entry.get('changePercent'),
                        ))

            # Commit all changes to the database
            self.conn.commit()
        except Exception as e:
            print(f"Failed to fetch or insert OHLC data for symbol {symbol}: {str(e)}")


url = f"https://financialmodelingprep.com/api/v3/available-traded/list?apikey={api_key}"


async def fetch_tickers():
    """Download the full list of tradable tickers from FMP."""
    async with aiohttp.ClientSession() as session:
        async with session.get(url) as response:
            data = await response.text()
            return get_jsonparsed_data(data)


def main():
    """Rebuild backup_db/stocks.db from scratch."""
    # Start from a clean database each run.
    os.makedirs("backup_db", exist_ok=True)
    if os.path.exists("backup_db/stocks.db"):
        os.remove('backup_db/stocks.db')

    db = StockDatabase('backup_db/stocks.db')
    try:
        all_tickers = asyncio.run(fetch_tickers())
        asyncio.run(db.save_stocks(all_tickers))
    finally:
        db.close_connection()


if __name__ == "__main__":
    main()