import re
from urllib.request import urlopen

import numpy

# Example profile page: http://finance.yahoo.com/q/pr?s=spy+profile
_PROFILE_URL = "http://finance.yahoo.com/q/pr?s={symbol}+profile"
_DEFAULT_SYMBOLS = ("VDIGX", "VFIAX")

# The label and its figure are matched in ONE pattern.  The lazy ``.*?`` is
# followed by the number group so it is forced to extend up to the first
# decimal after the label (a trailing lazy quantifier would match nothing).
# DOTALL lets the gap span line breaks in the decoded page.
_EXPENSE_RATIO_RE = re.compile(
    r"Annual Report Expense Ratio.*?(\d+\.\d+)", re.DOTALL
)


def _extract_expense_ratio(html):
    """Return the first decimal number following the expense-ratio label.

    Returns the number as a string (e.g. ``"0.27"``), or ``None`` when the
    label, or a decimal number after it, is not present in *html*.
    """
    match = _EXPENSE_RATIO_RE.search(html)
    return match.group(1) if match else None


def _fetch_profile(symbol):
    """Download the profile page for *symbol* and return it as text."""
    # ``with`` closes the HTTP response even if reading or decoding fails.
    with urlopen(_PROFILE_URL.format(symbol=symbol)) as page:
        charset = page.headers.get_content_charset() or "utf-8"
        # Decode the bytes; str(bytes) would give the "b'...'" repr instead.
        return page.read().decode(charset, errors="replace")


def main(symbols=None, fetch=None):
    """Print a CSV table of fund symbols and their expense ratios.

    Args:
        symbols: Iterable of ticker symbols to look up.  Defaults to
            ``("VDIGX", "VFIAX")``.
        fetch: Callable taking a symbol and returning the profile page as a
            string.  Defaults to an HTTP download of the profile URL.

    Returns:
        The table as a list of ``[symbol, ratio]`` rows, preceded by the
        header row ``["Fund", "Most Recent Expense Ratio"]``.  Ratios are
        kept as the strings found in the page.

    Symbols whose page has no expense ratio are reported on stdout and left
    out of the table.  Errors raised by *fetch* (for the default fetcher,
    whatever ``urlopen`` raises) are not caught.
    """
    if symbols is None:
        symbols = _DEFAULT_SYMBOLS
    if fetch is None:
        fetch = _fetch_profile

    expenses = [["Fund", "Most Recent Expense Ratio"]]
    for symbol in symbols:
        ratio = _extract_expense_ratio(fetch(symbol))
        if ratio is None:
            print(symbol, "does not appear to be a fund with an expense ratio")
        else:
            expenses.append([symbol, ratio])

    print("\n".join(",".join(row) for row in expenses))
    return expenses


if __name__ == "__main__":
    main()