update metrics

MuslemRahimi 2024-10-22 22:35:10 +02:00
parent 0a2698509a
commit d03b7a58ee
2 changed files with 29 additions and 27 deletions

View File

@@ -52,10 +52,10 @@ def extract_sector(ticker, con):
         symbol = ?
     """
     try:
         df = pd.read_sql_query(query_template, con, params=(ticker,))
         sector = df['sector'].iloc[0]
     except:
         sector = None
     return sector

View File

@@ -6,6 +6,7 @@ from datetime import datetime
 from collections import defaultdict
 import re
 #Tell the SEC who you are
 set_identity("Max Mustermann max.mustermann@indigo.com")
@@ -370,12 +371,11 @@ def generate_revenue_dataset(dataset):
     return final_result
-def run(symbol):
+def process_filings(filings, symbol):
     revenue_sources = []
     geography_sources = []
-    filings = Company(symbol).get_filings(form=["10-Q","10-K"]).latest(20)
-    #print(filings[0].xbrl())
     for i in range(0,17):
         try:
@@ -383,7 +383,6 @@ def run(symbol):
             facts = filing_xbrl.facts.data
             latest_rows = facts.groupby('dimensions').head(1)
             for index, row in latest_rows.iterrows():
                 dimensions_str = row.get("dimensions", "{}")
                 try:
@@ -391,21 +390,19 @@ def run(symbol):
                 except (ValueError, SyntaxError):
                     dimensions_dict = {}
                 for column_name in [
                     "srt:StatementGeographicalAxis",
                     "us-gaap:StatementBusinessSegmentsAxis",
                     "srt:ProductOrServiceAxis",
                 ]:
                     product_dimension = dimensions_dict.get(column_name) if isinstance(dimensions_dict, dict) else None
-                    # Check if the namespace is 'us-gaap' and product_dimension is valid
                     if row["namespace"] == "us-gaap" and product_dimension is not None and (
                         product_dimension.startswith(symbol.lower() + ":") or
                         product_dimension.startswith("country" + ":") or
                         product_dimension.startswith("us-gaap"+":") or
                         product_dimension.startswith("srt"+":")
                     ):
                         replacements = {
                             "Member": "",
                             "VideoGameAccessories": "HardwareAndAccessories",
@@ -416,39 +413,44 @@ def run(symbol):
                             "srt:": "",
                             "SegmentMember": "",
                         }
                         name = product_dimension
                         for old, new in replacements.items():
                             name = name.replace(old, new)
-                        # Determine the target list and the name transformation logic
                         if symbol in ['SAVE','BA','NFLX','LLY','MSFT','META','NVDA','AAPL','GME']:
                             column_list = ["srt:ProductOrServiceAxis"]
                         else:
                             column_list = ["srt:ProductOrServiceAxis", "us-gaap:StatementBusinessSegmentsAxis"]
                         if column_name in column_list:
                             revenue_sources.append({"name": name, "value": row["value"], "date": row["end_date"]})
                         else:
                             geography_sources.append({"name": name, "value": row["value"], "date": row["end_date"]})
         except Exception as e:
             print(e)
+    return revenue_sources, geography_sources
+def run(symbol):
+    # First try with 10-Q filings only
+    filings = Company(symbol).get_filings(form=["10-Q"]).latest(20)
+    revenue_sources, geography_sources = process_filings(filings, symbol)
+    # If no geography sources found, try with 10-K filings
+    if not geography_sources:
+        print(f"No geography sources found in 10-Q for {symbol}, checking 10-K filings...")
+        filings_10k = Company(symbol).get_filings(form=["10-K"]).latest(20)
+        _, geography_sources = process_filings(filings_10k, symbol)
     print(geography_sources)
     revenue_dataset = generate_revenue_dataset(revenue_sources)
     geographic_dataset = generate_geography_dataset(geography_sources)
     final_dataset = {'revenue': revenue_dataset, 'geographic': geographic_dataset}
     with open(f"json/business-metrics/{symbol}.json", "w") as file:
         ujson.dump(final_dataset, file)
 if __name__ == "__main__":
-    for symbol in ['AMD','SAVE','BA','ADBE','NFLX','PLTR','MSFT','META','TSLA','NVDA','AAPL','GME']:
+    for symbol in []: #['SAVE','BA','ADBE','NFLX','PLTR','MSFT','META','TSLA','NVDA','AAPL','GME']:
+        #for AMD, SAVE we need 10-K form to get geography revenue
         run(symbol)
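
Note for reviewers: the extraction loop above keys everything off the dimensions column of the XBRL facts table. Below is a minimal, self-contained sketch of that dimension-parsing and member-name cleanup step, not part of this commit. The (ValueError, SyntaxError) guard in the diff suggests ast.literal_eval is used to parse the dimensions string, but that call is not visible here, so treat it as an assumption; the clean_member_name helper and the sample dimensions string are hypothetical, and REPLACEMENTS is only the subset of the real replacements dict visible in this diff.

import ast

# Subset of the replacements mapping shown in the diff; the full dict has more entries.
REPLACEMENTS = {
    "Member": "",
    "srt:": "",
    "SegmentMember": "",
}

def clean_member_name(product_dimension):
    # Hypothetical helper mirroring the sequential str.replace calls in the diff.
    name = product_dimension
    for old, new in REPLACEMENTS.items():
        name = name.replace(old, new)
    return name

# Hypothetical dimensions cell as it might appear in filing_xbrl.facts.data:
# a dict serialized to text, hence literal_eval and the (ValueError, SyntaxError) guard.
dimensions_str = "{'srt:StatementGeographicalAxis': 'srt:AmericasMember'}"
try:
    dimensions_dict = ast.literal_eval(dimensions_str)
except (ValueError, SyntaxError):
    dimensions_dict = {}

member = dimensions_dict.get("srt:StatementGeographicalAxis")
if member:
    print(clean_member_name(member))  # prints "Americas"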