Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
# Demo script: build a 20-row frame of random integers, bucket them into
# labelled ten-wide ranges with pd.cut, and attach a cycling categorical
# 'answer' column.
import numpy as np
import pandas as pd

# Random integers in [0, 100); randint's upper bound is exclusive.
df = pd.DataFrame({'value': np.random.randint(0, 100, 20)})

# One label per ten-wide bin: "0 - 9", "10 - 19", ..., "90 - 99".
labels = ["{0} - {1}".format(i, i + 9) for i in range(0, 100, 10)]

# Edges 0, 10, ..., 100 with right=False give half-open bins [low, low + 10),
# so a value such as 10 falls in "10 - 19", matching the label text.
df['range'] = pd.cut(df.value, range(0, 101, 10), right=False, labels=labels)

# A second, independent random column. The array is assigned directly instead
# of being wrapped in a throwaway one-column DataFrame first.
df['relation'] = np.random.randint(0, 100, len(df))

# Cycle good/bad/average down the rows. np.resize repeats the input just
# enough to fill the requested length, so no oversized array is built and
# then sliced.
df['answer'] = np.resize(['good', 'bad', 'average'], len(df))
df['answer'] = df['answer'].astype('category')
- In [2]: df.head(10)
- Out[2]:
- value range relation answer
- 0 16 10 - 19 19 good
- 1 52 50 - 59 61 bad
- 2 19 10 - 19 83 average
- 3 23 20 - 29 43 good
- 4 18 10 - 19 44 bad
- 5 41 40 - 49 86 average
- 6 52 50 - 59 40 good
- 7 78 70 - 79 74 bad
- 8 30 30 - 39 82 average
- 9 63 60 - 69 27 good
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement