import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from zipline.pipeline.data import master  
from zipline.pipeline import Pipeline
from zipline.pipeline.data import USEquityPricing
from zipline.research import run_pipeline
from zipline.pipeline.data import sharadar  
from zipline.pipeline.factors import CustomFactor

# Latest reported revenue per asset from the Sharadar fundamentals dataset.
# NOTE(review): 'ARQ' is presumably the as-reported quarterly dimension and
# period_offset=0 the most recent period -- confirm against the Sharadar docs.
revenue = sharadar.Fundamentals.slice(dimension='ARQ', period_offset=0).REVENUE.latest

# Pipeline with a single 'Revenue' column, screened down to the 500 assets
# ranked highest by that same revenue term.
pipe = Pipeline(
    columns={
        'Revenue': revenue
    },
    screen=revenue.top(500)
)
# Run the pipeline for one day only (start_date == end_date) against the
# 'usstock-1d-bundle' bundle, then report how many rows came back.
res = run_pipeline(pipe, start_date='2016-01-04', end_date='2016-01-04', bundle='usstock-1d-bundle')
print("There are %d assets in this universe." % len(res))

res.head(10) # first 10 constituents; a bare expression, so it is only displayed when run as a notebook cell

There are 500 assets in this universe.

# Bind the top-500-by-revenue filter to the name Lectures500 so the code
# below can pass it around as the universe (as a screen or as a column).
Lectures500 = revenue.top(500)

def get_sectors(day, universe, bundle):
    """Run a one-day pipeline that reports a 'Sector' column for `universe`.

    `day` is used as both start and end date, `universe` is applied as the
    pipeline screen, and `bundle` is forwarded to `run_pipeline`. The first
    index level of the pipeline result is dropped before returning.
    """
    sector_term = master.SecuritiesMaster.usstock_Sector.latest
    sector_pipe = Pipeline(columns={'Sector': sector_term}, screen=universe)
    single_day = run_pipeline(sector_pipe, start_date=day, end_date=day, bundle=bundle)
    # Only one day was requested, so the datetime index level carries no
    # information; discard it.
    return single_day.reset_index(level=0, drop=True)


def calculate_sector_counts(sectors):
    """Return the number of rows of `sectors` falling under each 'Sector' value.

    `sectors` must be groupable by the key 'Sector'; the result is indexed by
    the distinct sector values.
    """
    grouped_by_sector = sectors.groupby('Sector')
    return grouped_by_sector.size()

# Look up the sector of every Lectures500 member on 2016-01-04, then count
# how many members fall into each sector.
lectures500_sectors = get_sectors('2016-01-04', Lectures500, 'usstock-1d-bundle')
lectures500_counts = calculate_sector_counts(lectures500_sectors)

def plot_sector_counts(sector_counts):
    """Plot `sector_counts` twice, side by side: a bar chart and a pie chart.

    The current figure is split on a 10x12 grid; the bar chart takes the left
    six columns and the pie chart the right six. Nothing is returned.
    """
    grid_shape = (10, 12)
    bar_ax = plt.subplot2grid(grid_shape, (0, 0), rowspan=10, colspan=6)
    pie_ax = plt.subplot2grid(grid_shape, (0, 6), rowspan=10, colspan=6)

    # Left panel: raw counts per sector.
    sector_counts.plot(kind='bar', color='b', rot=30, ax=bar_ax)
    bar_ax.set_title('Sector Exposure - Counts')

    # Right panel: the same counts shown as percentage shares.
    sector_counts.plot(kind='pie', colormap='Set3', autopct='%.2f %%', fontsize=12, ax=pie_ax)
    # Blank out the y-label; per the original author's note the default
    # label would otherwise be None.
    pie_ax.set_ylabel('')
    pie_ax.set_title('Sector Exposure - Proportions')

    plt.tight_layout()

# Draw the bar and pie charts for the sector counts computed above.
plot_sector_counts(lectures500_counts)

# Evaluate the Lectures500 filter as a pipeline column (no screen) for every
# day between 2015-01-01 and 2016-01-01.
res = run_pipeline(Pipeline(columns={'Lectures500' : Lectures500}), start_date='2015-01-01', end_date='2016-01-01', bundle='usstock-1d-bundle')
# Pivot the inner index level into columns, treat missing entries as
# False (not in the universe), and convert the flags to 1/0 integers.
res = res.unstack().fillna(False).astype(int)

def calculate_daily_turnover(unstacked):
    """Count, per row and per top-level column group, how many flags changed.

    Parameters
    ----------
    unstacked : pandas.DataFrame
        Numeric membership flags (the callers in this file pass 1/0 integers).
        Level 0 of the columns names the group (the universe) and each column
        within it is one member. Rows are compared with the row before them.
        # NOTE(review): rows are presumably trading days -- confirm with caller.

    Returns
    -------
    pandas.DataFrame
        One column per level-0 group and one row per input row except the
        first; each cell is the number of columns in that group whose value
        differs from the previous row.
    """
    changes = (unstacked
               .diff()      # +1 / -1 where a flag flipped relative to the previous row
               .abs()       # an addition and a removal both count as one change
               .iloc[1:])   # the first row has no predecessor, so diff() left it as NaN

    # DataFrame.groupby(axis=1) is deprecated since pandas 2.1. Grouping the
    # transposed frame by index level 0 and transposing back yields the same
    # per-group column sums without relying on the `axis` argument.
    return changes.T.groupby(level=0).sum().T

def plot_daily_turnover(unstacked):
    """Plot the per-day turnover computed by `calculate_daily_turnover`.

    Draws the turnover frame on a 14x8 figure with the grid switched off and
    a title and y-axis label attached. Nothing is returned.
    """
    # Number of membership changes per day, plotted straight from the frame.
    axes = calculate_daily_turnover(unstacked).plot(figsize=(14, 8))

    # Labelling and cosmetics.
    axes.set_title('Changes per Day')
    axes.set_ylabel('Number of Added or Removed Assets')
    axes.grid(False)
    

def print_daily_turnover_stats(unstacked):
    """Print selected summary statistics of the daily turnover of `unstacked`.

    The statistics are taken from `describe()` on the turnover frame and
    printed in the order mean, std, quartiles, min, max.
    """
    stat_rows = ['mean', 'std', '25%', '50%', '75%', 'min', 'max']
    summary = calculate_daily_turnover(unstacked).describe()
    print(summary.loc[stat_rows])

# Chart and summarise the day-to-day turnover of the unsmoothed universe.
plot_daily_turnover(res)
print_daily_turnover_stats(res)

      Lectures500
mean     1.349206
std      2.432573
25%      0.000000
50%      0.000000
75%      2.000000
min      0.000000
max     18.000000

from zipline.pipeline.filters import AtLeastN

# Rebind Lectures500 to a smoothed version of itself: the original filter is
# fed into AtLeastN with a 21-row window and N=16.
# NOTE(review): presumably an asset passes only if it was in the raw universe
# on at least 16 of the trailing 21 days -- confirm against the AtLeastN docs.
Lectures500 = AtLeastN(inputs=[Lectures500],
                       window_length=21,
                       N=16,)

# Evaluate the smoothed filter over the same 2015-01-01..2016-01-01 range as
# the unsmoothed run so the two turnover profiles can be compared.
res_smoothed = run_pipeline(Pipeline(columns={'Lectures500 Smoothed' : Lectures500}), 
                            start_date='2015-01-01',
                            end_date='2016-01-01',
                            bundle='usstock-1d-bundle')
# Same reshaping as for the unsmoothed result: pivot, fill gaps with False,
# convert to 1/0 integers.
res_smoothed = res_smoothed.unstack().fillna(False).astype(int)

# Chart and summarise the turnover of the smoothed universe.
plot_daily_turnover(res_smoothed)
print_daily_turnover_stats(res_smoothed)

      Lectures500 Smoothed
mean              0.944444
std               1.301581
25%               0.000000
50%               0.000000
75%               1.000000
min               0.000000
max               9.000000

                                                              Revenue
2016-01-04 00:00:00+00:00 Equity(FIBBG005P7Q881 [AAL])   1.070600e+10
                          Equity(FIBBG000F7RCJ1 [AAP])   2.295203e+09
                          Equity(FIBBG000B9XRY4 [AAPL])  5.150100e+10
                          Equity(FIBBG000DK5Q25 [ABB])   1.034600e+10
                          Equity(FIBBG0025Y4RY4 [ABBV])  5.944000e+09
                          Equity(FIBBG000MDCQC2 [ABC])   3.547038e+10
                          Equity(FIBBG000BKDWB5 [ABG])   1.716400e+09
                          Equity(FIBBG000B9ZXB4 [ABT])   5.150000e+09
                          Equity(FIBBG000F61RJ8 [ACM])   4.723637e+09
                          Equity(FIBBG000D9D830 [ACN])   8.465984e+09

# Universe Selection

## What is a Universe?

## Lectures500

## Sector Exposure

## Turnover

## Smoothing