Copper - Easy data analysis and machine learning in Python
As part of my Master in IT & Management, this semester I am taking a class called "Advanced Business Intelligence", which is what business people call machine learning or data analysis; in general they teach how to use SAS (Enterprise Miner) to do data mining.
SAS Enterprise Miner is good software, but it has some problems:
- It costs a lot of money
- It is slow as hell, seriously
- It is good for business people, not so much for engineers
- It costs a lot of money
I was able to get it for $100 because the university has an arrangement with SAS, but without that it is practically impossible to buy for personal use. For that reason I started learning R (on Coursera) and Python data analysis packages (pandas and scikit-learn) while I was taking my (basic) Business Intelligence class.
I learned that it is possible to replace SAS with R or Python, but some easy tasks can take a long time. I want to contribute by making some of those tasks easier while I keep learning Python. So I am going to try to do everything we do in my BI class with Python, and turn it into a package that makes some tasks easier.
The first week was a review of how to import data into SAS Enterprise Miner and explore it a little bit.
Copper
After thinking a lot about what to call the package I decided to call it copper (inspired by the dog from The Fox and the Hound, a.k.a. the saddest movie ever).
Importing
Note: I am going to use the same data as in my class, a dataset about donations, available here: donors.csv
One thing that SAS does really well and pandas does not have is metadata:
- It understands the type of each column: for example, columns with money symbols are converted to numbers that can later be used for machine learning.
- It can also change the type (or level, as SAS calls it) of a column to categorical or numeric, and it can define roles: for example, rejected columns are not used for machine learning, which makes it very easy to try different combinations.
So I created a class called Dataset, which is a wrapper around a few pandas DataFrames, to introduce metadata.
To load data, first import copper and then configure the project path. Inside the project directory there needs to be another folder called 'data' that holds the data (csv files, for example).
import copper
copper.project.path = '../'
Then create a new Dataset and load the data.csv file from the data folder.
ds = copper.Dataset()
ds.load('data.csv')
Metadata
By default copper tries to find the best match for each column, similar to what SAS does.
- Depending on the name of each column it decides which are the target and ID columns; the rest are inputs.
- It also tries to figure out the type of each column depending on its dtype (from pandas/numpy) and its content: for example, if the dtype is object but most of the values start with a $ symbol, it defines the column as a money column.
ds.metadata
 | Role | Type |
---|---|---|
TARGET_B | Input | Number |
ID | ID | Number |
TARGET_D | Input | Money |
GiftCnt36 | Input | Number |
GiftCntAll | Input | Number |
GiftCntCard36 | Input | Number |
GiftCntCardAll | Input | Number |
GiftAvgLast | Input | Money |
GiftAvg36 | Input | Money |
GiftAvgAll | Input | Money |
GiftAvgCard36 | Input | Money |
GiftTimeLast | Input | Number |
GiftTimeFirst | Input | Number |
PromCnt12 | Input | Number |
PromCnt36 | Input | Number |
PromCntAll | Input | Number |
PromCntCard12 | Input | Number |
PromCntCard36 | Input | Number |
PromCntCardAll | Input | Number |
StatusCat96NK | Input | Category |
StatusCatStarAll | Input | Number |
DemCluster | Input | Number |
DemAge | Input | Number |
DemGender | Input | Category |
DemHomeOwner | Input | Category |
DemMedHomeValue | Input | Money |
DemPctVeterans | Input | Number |
DemMedIncome | Input | Money |
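The "$ symbol" heuristic mentioned above can be sketched in plain pandas. This is only an illustration of the idea, not copper's actual implementation:

```python
import pandas as pd

# A toy object-dtype column, like DemMedIncome looks in the raw csv
col = pd.Series(['$10.00', '$25.50', '$5.00', '$12.25'], dtype=object)

# Heuristic: object dtype, but most values start with '$' -> treat as money
is_money = col.dtype == object and col.str.startswith('$').mean() > 0.5
print(is_money)
```

The same pattern (dtype check plus a content check) works for detecting other column types as well.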
Of course it is possible to change the default role and type of each column; let's fix some of the metadata:
ds.role['TARGET_D'] = ds.REJECTED
ds.role['TARGET_B'] = ds.TARGET
ds.type['ID'] = ds.CATEGORY
ds.metadata.head(3)
 | Role | Type |
---|---|---|
TARGET_B | Target | Number |
ID | ID | Category |
TARGET_D | Rejected | Money |
Depending on the metadata, copper transforms the data. Mainly it transforms non-numbers into numbers to make machine learning possible; scikit-learn only accepts numbers. But more on that in a later post.
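The transformation is roughly what pandas can do with get_dummies plus a bit of string cleaning. A sketch of the idea (not copper's actual code), using made-up values:

```python
import pandas as pd

df = pd.DataFrame({
    'DemGender': ['F', 'M', 'U', 'F'],
    'GiftAvgLast': ['$10.00', '$25.50', '$5.00', '$12.25'],
})

# Money column: strip the '$' and parse as float
money = df['GiftAvgLast'].str.replace('$', '', regex=False).astype(float)

# Category column: one 0/1 column per category
dummies = pd.get_dummies(df['DemGender'], prefix='DemGender').astype(int)

# All-numeric inputs, ready for machine learning
inputs = pd.concat([money, dummies], axis=1)
print(inputs)
```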
Histograms
Before going into machine learning it is a good idea to explore the data; the usual way is with a histogram. It is easy to explore money (numerical) columns. I remove the legend because it is too big, but the method can also return a list with the information of each bin.
ds.histogram('DemMedIncome', legend=False, retList=True)
0     0.0 - 10000.05: 2358
1     10000.0 - 20000.10: 9
2     20000.1 - 30000.15: 304
3     30000.1 - 40000.20: 1397
4     40000.2 - 50000.25: 2187
5     50000.2 - 60000.30: 1303
6     60000.3 - 70000.35: 921
7     70000.3 - 80000.40: 550
8     80000.4 - 90000.45: 290
9     90000.4 - 100000.50: 130
10    100000.5 - 110000.55: 110
11    110000.5 - 120000.60: 39
12    120000.6 - 130000.65: 34
13    130000.6 - 140000.70: 18
14    140000.7 - 150000.75: 7
15    150000.8 - 160000.80: 13
16    160000.8 - 170000.85: 7
17    170000.8 - 180000.90: 7
18    180000.9 - 190000.95: 0
19    190000.9 - 200001.00: 2
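Under the hood a bin list like this can be computed with plain numpy. A sketch with a few made-up income values (not copper's code):

```python
import numpy as np

income = np.array([12000, 45000, 38000, 61000, 52000, 48000, 30000, 99000])

# numpy returns the count per bin and the bin edges
counts, edges = np.histogram(income, bins=4)
for i, (lo, hi, n) in enumerate(zip(edges[:-1], edges[1:], counts)):
    print(f'{i}  {lo:.1f} - {hi:.1f}: {n}')
```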
It is also possible to explore categorical variables.
ds.histogram('DemGender')
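A categorical histogram is essentially a value count per category; in plain pandas (again just a sketch, with made-up values):

```python
import pandas as pd

# Toy version of the DemGender column
gender = pd.Series(['F', 'M', 'F', 'U', 'F', 'M'], name='DemGender')

# One bar per category = the count of each distinct value
print(gender.value_counts())
```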
Inputs
We can take a look at how the data is transformed.
ds.inputs
<class 'pandas.core.frame.DataFrame'>
Int64Index: 9686 entries, 0 to 9685
Data columns:
GiftCnt36            9686  non-null values
GiftCntAll           9686  non-null values
GiftCntCard36        9686  non-null values
GiftCntCardAll       9686  non-null values
GiftAvgLast          9686  non-null values
GiftAvg36            9686  non-null values
GiftAvgAll           9686  non-null values
GiftAvgCard36        7906  non-null values
GiftTimeLast         9686  non-null values
GiftTimeFirst        9686  non-null values
PromCnt12            9686  non-null values
PromCnt36            9686  non-null values
PromCntAll           9686  non-null values
PromCntCard12        9686  non-null values
PromCntCard36        9686  non-null values
PromCntCardAll       9686  non-null values
StatusCat96NK [A]    9686  non-null values
StatusCat96NK [E]    9686  non-null values
StatusCat96NK [F]    9686  non-null values
StatusCat96NK [L]    9686  non-null values
StatusCat96NK [N]    9686  non-null values
StatusCat96NK [S]    9686  non-null values
StatusCatStarAll     9686  non-null values
DemCluster           9686  non-null values
DemAge               7279  non-null values
DemGender [F]        9686  non-null values
DemGender [M]        9686  non-null values
DemGender [U]        9686  non-null values
DemHomeOwner [H]     9686  non-null values
DemHomeOwner [U]     9686  non-null values
DemMedHomeValue      9686  non-null values
DemPctVeterans       9686  non-null values
DemMedIncome         9686  non-null values
dtypes: float64(7), int64(26)
inputs is a pandas DataFrame. We can see that each categorical variable is divided into several columns filled with ones and zeros to make machine learning possible, and that money columns are converted to plain numbers. Since the dtypes are float and int, the data can go straight into scikit-learn by calling inputs.values to get a numpy array.
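Once everything is numeric, feeding those values into scikit-learn is direct. A minimal sketch with a tiny made-up frame (the column names just mimic the real ones):

```python
import pandas as pd
from sklearn.linear_model import LogisticRegression

# Tiny stand-in for ds.inputs and the TARGET_B column
inputs = pd.DataFrame({
    'GiftCnt36':     [1, 4, 2, 8, 3, 7],
    'DemGender [F]': [1, 0, 1, 0, 1, 0],
})
target = pd.Series([0, 1, 0, 1, 0, 1], name='TARGET_B')

X = inputs.values   # plain numpy array, which scikit-learn expects
y = target.values
model = LogisticRegression().fit(X, y)
print(model.predict(X))
```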
Conclusion
That's it for now. Next week I hope to get the scikit-learn integration working, to make comparing models as easy as (and why not easier than) with SAS.
The code is on GitHub: copper