|
166 | 166 | "outputs": [], |
167 | 167 | "source": [ |
168 | 168 | "# Note that pd.read_csv is used because we imported pandas as pd\n", |
169 | | - "surveys_df = pd.read_csv(\"../data/surveys.csv\")" |
| 169 | + "surveys_df = pd.read_csv('../data/surveys.csv')" |
170 | 170 | ] |
171 | 171 | }, |
172 | 172 | { |
|
182 | 182 | "outputs": [], |
183 | 183 | "source": [ |
184 | 184 | "# Note that pd.read_csv is used because we imported pandas as pd\n", |
185 | | - "pd.read_csv(\"../data/surveys.csv\")" |
| 185 | + "pd.read_csv('../data/surveys.csv')" |
186 | 186 | ] |
187 | 187 | }, |
188 | 188 | { |
|
972 | 972 | " * **Sélection** : `df['nom_colonne']`\n", |
973 | 973 | " * **Méthodes** :\n", |
974 | 974 | " * Statistiques descriptives :\n", |
975 | | - " `count()`, `mean()`, `std()`, `min()`, `median()`, `max()`\n", |
976 | | - " * Autres : `describe()`, `nunique()`, `unique()`\n", |
| 975 | + " * `count()`, `mean()`, `std()`\n", |
| 976 | + " * `min()`, `median()`, `max()`\n", |
| 977 | + " * `nunique()`, `unique()`\n", |
| 978 | + " * Sommaire statistique : `describe()`\n", |
977 | 979 | "* **Grouper selon les valeurs** d'une ou plusieurs colonnes :\n", |
978 | 980 | " * `groupby(nom_col)`\n", |
979 | 981 | " * `groupby([nom_col1, nom_col2])`\n", |
| 982 | + " * Statistiques descriptives : `aggregate([fonction1, ...])`\n", |
980 | 983 | "* **Tableaux croisés dynamiques**\n", |
981 | 984 | " * Transformation selon les valeurs de l'index : `unstack()`\n", |
982 | | - " * Aggrégation dans un tableau croisé dynamique : `pivot_table()`" |
| 985 | + " * Aggrégation dans un tableau croisé dynamique : `pivot_table()`\n", |
| 986 | + " * `values=colX`\n", |
| 987 | + " * `index=[col_ind]`\n", |
| 988 | + " * `columns=[categorie1, categorie2]`\n", |
| 989 | + " * `aggfunc=fonction` (défaut: moyenne)" |
983 | 990 | ] |
984 | 991 | }, |
985 | 992 | { |
|
1001 | 1008 | " * **Selection**: `df['column_name']`\n", |
1002 | 1009 | " * **Methods**:\n", |
1003 | 1010 | " * Descriptive statistics:\n", |
1004 | | - " `count()`, `mean()`, `std()`, `min()`, `median()`, `max()`\n", |
1005 | | - " * Others: `describe()`, `nunique()`, `unique()`\n", |
| 1011 | + " * `count()`, `mean()`, `std()`\n", |
| 1012 | + " * `min()`, `median()`, `max()`\n", |
| 1013 | + " * `nunique()`, `unique()`\n", |
| 1014 | + " * Statistical summary: `describe()`\n", |
1006 | 1015 | "* **Grouping by values** of one or many columns:\n", |
1007 | 1016 | " * `groupby(column_name)`\n", |
1008 | 1017 | " * `groupby([column_name1, column_name2])`\n", |
| 1018 | + " * Descriptive statistics: `aggregate([function1, ...])`\n", |
1009 | 1019 | "* **Pivot tables**\n", |
1010 | 1020 | " * Reshaping a DataFrame from values in the index: `unstack()`\n", |
1011 | | - " * Aggregation in a pivot table: `pivot_table()`" |
| 1021 | + " * Aggregation in a pivot table: `pivot_table()`\n", |
| 1022 | + " * `values=colX`\n", |
| 1023 | + " * `index=[col_ind]`\n", |
| 1024 | + " * `columns=[category1, category2]`\n", |
| 1025 | + " * `aggfunc=function` (default: mean)" |
1012 | 1026 | ] |
1013 | 1027 | }, |
1014 | 1028 | { |
|
0 commit comments