import pandas as pd
from IPython.display import display, HTML

# Stylesheet injected into the notebook page: elements with class `.output`
# lay out their children in a row instead of a column.
# NOTE(review): presumably this is so that display(df, df_bis) shows the two
# tables side by side — confirm against the notebook front end in use.
CSS = """
.output {
    flex-direction: row;
}
"""
# Wrap the stylesheet in a <style> tag and hand it to IPython as an HTML object.
# NOTE(review): a bare expression is typically rendered only when it is the last
# statement of a cell; if this cell contains more code, display(HTML(...)) may
# be needed — confirm.
HTML('<style>{}</style>'.format(CSS))

# Build a DataFrame from a dictionary that maps each column name to its values;
# the row labels are given by `index`.
df = pd.DataFrame({'prix': [1.1, 0.8, 0.6], 'stock': [0, 22, 51]},
                  index=['stylo', 'crayon', 'gomme'])

# Another way to build the same DataFrame: a list of rows (the list shape is
# index x columns), with the column names passed separately.
df_bis = pd.DataFrame([[1.1, 0], [0.8, 22], [0.6, 51]],
                      index=['stylo', 'crayon', 'gomme'],
                      columns=['prix', 'stock'])  # 'stock' (not 'stocks') so that df_bis matches df
display(df, df_bis)

# A column can be read as an attribute or with brackets; both give the same Series.
print(df.prix, '\n')
print(df['prix'], '\n')     # use brackets when the name is a keyword or has spaces or accents
print(type(df.prix))        # a single column is a pandas Series

stylo     1.1
crayon    0.8
gomme     0.6
Name: prix, dtype: float64 

stylo     1.1
crayon    0.8
gomme     0.6
Name: prix, dtype: float64 

<class 'pandas.core.series.Series'>

# Build a new DataFrame from Series that do not share the same index:
# the resulting index holds the labels of all the Series, and entries
# missing from a given Series show up as NaN.
df2 = pd.DataFrame({'prix': df.prix,    # reuse column 'prix' of df
                    'stock': df.stock, 
                    'promo': pd.Series([0.2,0,0.05], index=['stylo','papier','crayon']) # Series with a different index
                   })
df2

print(df2.prix.index)
print(df2.prix.values)

Index(['crayon', 'gomme', 'papier', 'stylo'], dtype='object')
[0.8 0.6 nan 1.1]

print(df2.index)
print(df2.values)

Index(['crayon', 'gomme', 'papier', 'stylo'], dtype='object')
[[8.0e-01 2.2e+01 5.0e-02]
 [6.0e-01 5.1e+01     nan]
 [    nan     nan 0.0e+00]
 [1.1e+00 0.0e+00 2.0e-01]]

df2.columns

Index(['prix', 'stock', 'promo'], dtype='object')

# Deliberate error: attribute access only resolves column names, and 'gomme'
# is a row label, so this raises AttributeError.
df.gomme

---------------------------------------------------------------------------
AttributeError                            Traceback (most recent call last)
/tmp/ipykernel_701/1153377621.py in ?()
----> 1 df.gomme

/opt/conda/lib/python3.11/site-packages/pandas/core/generic.py in ?(self, name)
   6292             and name not in self._accessors
   6293             and self._info_axis._can_hold_identifiers_and_holds_name(name)
   6294         ):
   6295             return self[name]
-> 6296         return object.__getattribute__(self, name)

AttributeError: 'DataFrame' object has no attribute 'gomme'

df2.loc['crayon']

prix      0.80
stock    22.00
promo     0.05
Name: crayon, dtype: float64

# .loc selects by label: rows 'gomme' and 'crayon', columns given by the label slice :'stock'.
df2.loc[['gomme','crayon'],:'stock']

# .iloc selects by integer position: [0, 0] is the first row, first column.
print(df2.iloc[0,0])
df2.iloc[0:2, :]   # positional slice of rows, all columns

0.8

df2[['prix','stock']][0:2] # may seem more natural but is less efficient

print(df2.at['gomme', 'stock'])   # same as loc['gomme', 'stock'] but faster
print(df2.iat[1, 0])              # positional counterpart of .at: row 1, column 0

51.0
0.6

# Boolean mask on the rows: only products whose promo is already > 0 are modified.
df2.loc[df2.promo > 0, 'promo'] += 0.10  # add 0.10 (10 points) to the discount of products already on sale
df2

df2.query('0.1 < promo < 0.3')

# Same kind of update written with query(): the filtered rows are only used for their index.
df2.loc[df2.query('promo > 0').index, 'promo'] += 0.1   # query() builds an intermediate partial copy of df2

# Element-wise product of the two columns, then summed over all rows.
print("Stock value = %f\n" % (df.prix * df.stock).sum())

Stock value = 48.200000

import numpy as np

np.sin(df2.promo)  # just to show that it can be done

crayon    0.247404
gomme          NaN
papier    0.000000
stylo     0.389418
Name: promo, dtype: float64

`query`	Python
`'A in B'`	`df[df.A.isin(df.B)]`
`'A not in B'`	`df[~df.A.isin(df.B)]`
`'C in [1,2,4,8]'`	`df[df.C.isin([1,2,4,8])]`
`'A == 3 and A > B > C'`	`df[(df['A'] == 3) & (df['A'] > df['B']) & (df['B'] > df['C'])]`

Structure du `DataFrame`¶

Sélectionner une partie du tableau¶

Le piège de l'indexation (loc et iloc)¶

Optimisation (at & iat)¶

Les filtres logiques¶

Query¶

Agir globalement¶

Plus¶

	prix	stock	promo
crayon	0.8	22.0	0.05
gomme	0.6	51.0	NaN
papier	NaN	NaN	0.00
stylo	1.1	0.0	0.20

	prix	stock	promo
crayon	0.8	22.0	0.15
gomme	0.6	51.0	NaN
papier	NaN	NaN	0.00
stylo	1.1	0.0	0.30

Structure du DataFrame¶

Sélectionner une partie du tableau¶

Le piège de l'indexation (loc et iloc)¶

Optimisation (at & iat)¶

Les filtres logiques¶

Query¶

Agir globalement¶

Plus¶

Structure du `DataFrame`¶