Identifying price swings/trends in pandas dataframe with stock quotes

Question 1

It's a bit tricky, since you cannot mark a point as a pivot until you have found the next potential pivot (i.e. if you are in an upward trend, you can't say it has ended until you find a low that is sufficiently far below the last high).

This code does the trick. For convenience I put your data in a file named tmpData.txt, and it produces the desired result. Please check:

def get_pivots(path='tmpData.txt', diff=.3):
    """Load OHLC quotes from a CSV file and mark the price-swing pivots.

    The file is read with its first column as a date-parsed index and must
    provide ``open``, ``high`` and ``low`` columns.  A ``swings`` column is
    added: it is NaN everywhere except on pivot rows, where it holds the
    signed size of the swing that ended on that row.

    A pivot can only be confirmed in hindsight.  While a trend is running,
    each new extreme moves the provisional pivot forward (the previous
    provisional entry is cleared); the trend is reversed once price moves
    more than ``diff`` against the current pivot.

    Args:
        path: File path or file-like object accepted by ``pandas.read_csv``.
        diff: Minimum adverse move that counts as a trend reversal.

    Returns:
        The loaded DataFrame with the added ``swings`` column.  The frame is
        also printed, as before.
    """
    # read_csv(..., index_col=0, parse_dates=True) is the documented
    # replacement for the removed DataFrame.from_csv.
    data = pd.read_csv(path, index_col=0, parse_dates=True)
    data['swings'] = np.nan

    if data.empty:
        # Nothing to scan; avoid indexing the first row of an empty frame.
        print(data)
        return data

    highs = data['high'].to_numpy(dtype=float)
    lows = data['low'].to_numpy(dtype=float)
    swings = np.full(len(data), np.nan)

    # The first open is the reference price until a trend is established.
    pivot = data['open'].iloc[0]
    last_pivot_id = 0
    up_down = 0  # 0: no trend yet, 1: up-trend, -1: down-trend

    for i, (high, low) in enumerate(zip(highs, lows)):
        if up_down == 0:
            # We don't have a trend yet
            if low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1
            elif high > pivot + diff:
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

        elif up_down == 1:
            # Current trend is up
            if high > pivot:
                # New high: the previous pivot wasn't a real one, so move
                # its swing here, extended by the extra rise.
                swings[i] = swings[last_pivot_id] + (high - highs[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = high, i
            elif low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1

        else:
            # Current trend is down
            if low < pivot:
                # New low: the previous pivot wasn't a real one, so move
                # its swing here, extended by the extra drop.
                swings[i] = swings[last_pivot_id] + (low - lows[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = low, i
            elif high > pivot + diff:
                # Reversal requires a rise of more than ``diff`` ABOVE the
                # low pivot (the original compared against pivot - diff).
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

    data['swings'] = swings
    print(data)
    return data

Output:

date                  close  high    low     open    volume    swings                                            
2014-05-09 13:30:00  187.56  187.73  187.54  187.70  1922600     NaN
2014-05-09 13:31:00  187.49  187.56  187.42  187.55   534400     NaN
2014-05-09 13:32:00  187.42  187.51  187.35  187.49   224800   -0.35
2014-05-09 13:33:00  187.55  187.58  187.39  187.40   303700     NaN
2014-05-09 13:34:00  187.67  187.67  187.53  187.56   438200     NaN
2014-05-09 13:35:00  187.60  187.71  187.56  187.68   296400    0.36
2014-05-09 13:36:00  187.41  187.67  187.38  187.60   329900     NaN
2014-05-09 13:37:00  187.31  187.44  187.28  187.40   404000     NaN
2014-05-09 13:38:00  187.26  187.37  187.26  187.30   912800     NaN
2014-05-09 13:39:00  187.22  187.28  187.12  187.25   607700   -0.59

Question 2

I updated tw0000's code, as it had a small bug: some lines used the hard-coded 'O' instead of cols[0].

def get_pivots(df, cols=('O', 'H', 'L', 'C'), diff=.3):
    """Mark price-swing pivots in an OHLC DataFrame, in place.

    Adds a ``swings`` column to ``df``.  The first and last rows are seeded
    with their own open price; every other row is NaN unless it is a pivot,
    in which case it holds the signed size of the swing that ended there.
    A seeded row that turns out to be a pivot gets the swing size instead.

    While a trend is running, each new extreme moves the provisional pivot
    forward (the previous provisional entry is cleared); the trend reverses
    once price moves more than ``diff`` against the current pivot.

    Args:
        df: DataFrame holding the price columns named in ``cols``.
        cols: Column names in open, high, low, close order.  Only the first
            three are read.
        diff: Minimum adverse move that counts as a trend reversal.

    Returns:
        None; ``df`` is modified in place.
    """
    open_col, high_col, low_col = cols[0], cols[1], cols[2]

    swings = np.full(len(df), np.nan)
    if len(df) == 0:
        # Nothing to scan; still provide the (empty) output column.
        df['swings'] = swings
        return

    opens = df[open_col].to_numpy(dtype=float)
    highs = df[high_col].to_numpy(dtype=float)
    lows = df[low_col].to_numpy(dtype=float)

    # Seed both ends with their open price, as the original code did.
    swings[0] = opens[0]
    swings[-1] = opens[-1]

    # The first open is the reference price until a trend is established.
    pivot = opens[0]
    last_pivot_id = 0
    up_down = 0  # 0: no trend yet, 1: up-trend, -1: down-trend

    for i, (high, low) in enumerate(zip(highs, lows)):
        if up_down == 0:
            # We don't have a trend yet
            if low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1
            elif high > pivot + diff:
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

        elif up_down == 1:
            # Current trend is up
            if high > pivot:
                # New high: carry the previous pivot's swing forward,
                # extended by the extra rise, then clear the old pivot.
                # (The original assigned the cell to itself, losing it.)
                swings[i] = swings[last_pivot_id] + (high - highs[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = high, i
            elif low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1

        else:
            # Current trend is down (this branch was missing originally,
            # so nothing was detected after the first down move).
            if low < pivot:
                swings[i] = swings[last_pivot_id] + (low - lows[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = low, i
            elif high > pivot + diff:
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

    df['swings'] = swings

Question 3

How about this, assuming you only care about highs for the moment:

# Express each bar's high as a whole number of 0.3-wide steps away from the
# first open (astype(int) truncates toward zero).
startPx = df['open'].iloc[0]
level = (df['high'].sub(startPx) / .3).astype(int)
# Row-to-row change in step number; the first row has no predecessor (NaN).
df['swings'] = level.diff()

Now, to find out what the differences are, you would do something like:

# Keep only the rows whose swings entry is not 0 (NaN entries compare as
# "not equal" and are therefore kept too).
changes = df.loc[df['swings'].ne(0)]
# High of each kept row minus the open of the previously kept row.
diffs = changes['high'].sub(changes['open'].shift(1))

Question 4

I haven't tested this, but something like the following should get you what you want. One open question: what should happen if both low < pivot - diff and high > pivot + diff occur in the same minute?

def f(df):
    """Add a ``swings`` column marking moves of more than 0.3 from the pivot.

    Starting from the first row's ``open`` as the pivot, each row is checked
    in order: if its ``low`` is more than ``diff`` below the pivot, or
    otherwise its ``high`` is more than ``diff`` above it, the signed
    distance to the pivot is recorded and that low/high becomes the new
    pivot.  All other rows get NaN.  When both conditions hold for the same
    row, the low is the one that is used.

    Args:
        df: DataFrame with ``open``, ``high`` and ``low`` columns.

    Returns:
        None; ``df`` is modified in place.
    """
    diff = .3

    if len(df) == 0:
        # No first row to take the starting pivot from.
        df['swings'] = np.nan
        return

    pivot = df['open'].iloc[0]
    swings = []

    # An explicit loop keeps the running pivot in this scope.  The original
    # nested function assigned to ``pivot``, which made the name local to
    # that function and raised UnboundLocalError on its first comparison.
    for low, high in zip(df['low'], df['high']):
        if low < pivot - diff:
            swings.append(low - pivot)
            pivot = low
        elif high > pivot + diff:
            swings.append(high - pivot)
            pivot = high
        else:
            swings.append(np.nan)

    df['swings'] = swings

Question 5

I updated the answer from @Pawel-Kozela to be compatible with the latest version of pandas, and added an easy way to pass column names.

def get_pivots(df, cols=('O', 'H', 'L', 'C'), diff=.3):
    """Mark price-swing pivots in an OHLC DataFrame, in place.

    A ``swings`` column is written to ``df``.  Its first and last entries
    start out as the open price of those rows; all other entries are NaN
    unless the row is a pivot, where the entry is the signed size of the
    swing ending on that row.  If the first or last row is itself a pivot,
    the swing size replaces the seeded open price.

    A pivot is provisional while its trend continues: every new extreme
    takes over the accumulated swing and the earlier entry is cleared.  The
    trend flips when price moves more than ``diff`` against the pivot.

    Args:
        df: DataFrame holding the price columns named in ``cols``.
        cols: Column names in open, high, low, close order.  Only the first
            three are read.
        diff: Minimum adverse move that counts as a trend reversal.

    Returns:
        None; ``df`` is modified in place.
    """
    n_rows = len(df)
    swings = np.full(n_rows, np.nan)
    if n_rows == 0:
        # No rows to scan; still provide the (empty) output column.
        df['swings'] = swings
        return

    opens = df[cols[0]].to_numpy(dtype=float)
    highs = df[cols[1]].to_numpy(dtype=float)
    lows = df[cols[2]].to_numpy(dtype=float)

    # Seed both ends with their open price, as the original code did.
    swings[0] = opens[0]
    swings[-1] = opens[-1]

    # Until a trend exists, moves are measured from the first open.
    pivot = opens[0]
    last_pivot_id = 0
    up_down = 0  # 0: no trend yet, 1: up-trend, -1: down-trend

    for i, (high, low) in enumerate(zip(highs, lows)):
        # We don't have a trend yet
        if up_down == 0:
            if low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1
            elif high > pivot + diff:
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

        # Current trend is up
        elif up_down == 1:
            if high > pivot:
                # The last pivot wasn't a real one: move its swing to this
                # row, grown by the additional rise.  (Originally the cell
                # was assigned to itself, so the swing was simply erased.)
                swings[i] = swings[last_pivot_id] + (high - highs[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = high, i
            elif low < pivot - diff:
                swings[i] = low - pivot
                pivot, last_pivot_id = low, i
                up_down = -1

        # Current trend is down (branch absent from the original, which
        # therefore stopped detecting pivots after the first down move)
        else:
            if low < pivot:
                swings[i] = swings[last_pivot_id] + (low - lows[last_pivot_id])
                swings[last_pivot_id] = np.nan
                pivot, last_pivot_id = low, i
            elif high > pivot + diff:
                swings[i] = high - pivot
                pivot, last_pivot_id = high, i
                up_down = 1

    df['swings'] = swings