1 2 3 4 5 6 7 8 9 10 11 12 13 14 15
# Number the rows inside each 'Colonne A' group: every distinct 'Colonne B'
# value gets a 1-based rank in order of first appearance within its group.
import pandas as pd

df = pd.DataFrame({
    'Colonne A': [2001008799, 2001008799, 2001008799,
                  2000261690, 2000261690, 2000261690, 2000261690],
    'Colonne B': [9791820, 9791842, 9791843, 50016, 50023, 50024, 50069],
})

# pd.factorize returns (codes, uniques); codes are 0-based and follow the
# order of first appearance, hence the +1 to start numbering at 1.
# A repeated 'Colonne B' value inside a group would reuse the same number.
df['Besoin'] = (
    df.groupby('Colonne A')['Colonne B']
      .transform(lambda x: pd.factorize(x)[0] + 1)
)

print(df)
# Expected output:
#     Colonne A  Colonne B  Besoin
# 0  2001008799    9791820       1
# 1  2001008799    9791842       2
# 2  2001008799    9791843       3
# 3  2000261690      50016       1
# 4  2000261690      50023       2
# 5  2000261690      50024       3
# 6  2000261690      50069       4
Partager