# Product_Customer.py

#-*- coding: utf-8 -*-
"""Which demographic factors
(e.g.  household size, presence of children, income) appear to affect customer spend?  Engagement with certain categories?
    => HH_DEMOGRAPHIC
Details : AGE_DESC[0], MARITAL_STATUS_CODE[1], INCOME_DESC[2], HOMEOWNER_DESC[3], HH_COMP_DESC[4], HOUSEHOLD_SIZE_DESC[5], KID_CATEGORY_DESC[6], HOUSEHOLD_KEY[7]

1) Status
2) Age
3) HOMEOWNER_DESC -- Going to Salary
4) Household_key -->
(For each user: KidDescription)
a) Dictionary which is having values KID_CATEGORY_DESC
b) Household Size
c) Income
5)

A:
    45-54:
        'Homeowner' :
                '7' :
                    'KID' = 0
                    'Size' = 2
                    'Income' = 50-74K


b) Segment further: who is married vs. unmarried. """


from collections import OrderedDict
import csv
import yaml
import sys

# Nested segment tree; readCSV() fills it in place and dumps it to YAML.
customerStatus = {}
# Placeholder; readCSV() rebinds this to the mapping loaded from the
# customerMoreQuarterProductDictOverTime YAML file.
productDictOverTime = {}

def _insert_household(tree, row, ranked_products):
    """Add one demographic row to the nested segment tree (first row wins)."""
    node = tree
    # Nesting order: row[1] -> row[0] -> row[2] -> row[4] -> row[7]; missing
    # levels are created on the way down, existing ones are reused.
    for key in (row[1], row[0], row[2], row[4], row[7]):
        node = node.setdefault(key, {})
    if row[5] not in node:
        # A fresh OrderedDict per leaf keeps yaml.dump from emitting
        # anchors/aliases that point at one shared object.
        node[row[5]] = OrderedDict(ranked_products)


def readCSV(
        spend_path='/Users/Rick/Desktop/projectFinalFolder/segments/moreSpentOverTime.yaml',
        products_path='/Users/Rick/Desktop/projectFinalFolder/segments/customerMoreQuarterProductDictOverTime.yaml',
        demographics_path="/Users/Rick/Desktop/CSV/hh_demographic.csv",
        output_path="/Users/Rick/Desktop/productDictionarySorted.yaml"):
    """Build the nested demographic segment tree and dump it to YAML.

    Loads two YAML mappings, then scans the demographics CSV (the first line
    is skipped as a header). Every row whose column 7 is a key of BOTH
    mappings is inserted into the module-level ``customerStatus`` tree, nested
    by columns 1, 0, 2, 4, 7 and finally 5. Presumably these are marital
    status, age, income, household composition, household key and household
    size -- confirm against the CSV header. The leaf stored under column 5 is
    an ``OrderedDict`` of the product mapping sorted by value, descending.

    Side effects: mutates the global ``customerStatus``, rebinds the global
    ``productDictOverTime``, prints the tree to stdout and writes it to
    ``output_path``.

    Args:
        spend_path: YAML file whose keys select the households to keep.
        products_path: YAML file loaded into ``productDictOverTime``.
        demographics_path: CSV file with at least 8 columns per data row.
        output_path: destination of the YAML dump of ``customerStatus``.
    """
    global customerStatus
    global productDictOverTime

    # SECURITY NOTE(review): yaml.load() without an explicit Loader can
    # construct arbitrary Python objects and is rejected by recent PyYAML
    # releases. If these files only hold plain mappings, switch to
    # yaml.safe_load(); left unchanged here because the inputs may contain
    # python-specific tags.
    with open(spend_path, 'r') as f:
        moreSpentOverTime = yaml.load(f)

    with open(products_path, 'r') as f:
        productDictOverTime = yaml.load(f)

    # NOTE(review): every leaf receives the WHOLE product mapping, not
    # productDictOverTime[row[7]]. This looks like it may have been meant to
    # be per-household -- confirm before relying on the output.
    ranked_products = None

    with open(demographics_path, 'r') as f:
        data = csv.reader(f, delimiter=',')
        next(data)  # skip the header line
        for row in data:
            if len(row) < 8:
                # Blank or truncated line: nothing to index.
                continue
            if row[7] not in moreSpentOverTime:
                continue
            if row[7] not in productDictOverTime:
                continue
            if ranked_products is None:
                # Loop-invariant, so it is sorted once, on the first match.
                ranked_products = sorted(productDictOverTime.items(),
                                         key=lambda x: x[1], reverse=True)
            _insert_household(customerStatus, row, ranked_products)

    # Parenthesised single argument prints identically on Python 2 and 3.
    print(customerStatus)

    with open(output_path, 'w') as f:
        f.write(yaml.dump(customerStatus, default_flow_style=False))

def main():
    """Script entry point: run readCSV() with its default arguments."""
    readCSV()

# Run the pipeline only when executed as a script, not when imported.
if __name__ == "__main__":
    main()