|
976 | 976 | }
|
977 | 977 | ],
|
978 | 978 | "source": [
|
979 |
| - "sexes = sort(df_train['Sex'].unique())\n", |
| 979 | + "sexes = sorted(df_train['Sex'].unique())\n", |
980 | 980 | "genders_mapping = dict(zip(sexes, range(0, len(sexes) + 1)))\n",
|
981 | 981 | "genders_mapping"
|
982 | 982 | ]
|
|
1220 | 1220 | ],
|
1221 | 1221 | "source": [
|
1222 | 1222 | "# Get the unique values of Pclass:\n",
|
1223 |
| - "passenger_classes = sort(df_train['Pclass'].unique())\n", |
| 1223 | + "passenger_classes = sorted(df_train['Pclass'].unique())\n", |
1224 | 1224 | "\n",
|
1225 | 1225 | "for p_class in passenger_classes:\n",
|
1226 | 1226 | " print 'M: ', p_class, len(df_train[(df_train['Sex'] == 'male') & \n",
|
|
1430 | 1430 | ],
|
1431 | 1431 | "source": [
|
1432 | 1432 | "# Get the unique values of Embarked\n",
|
1433 |
| - "embarked_locs = sort(df_train['Embarked'].unique())\n", |
| 1433 | + "embarked_locs = sorted(df_train['Embarked'].unique())\n", |
1434 | 1434 | "\n",
|
1435 | 1435 | "embarked_locs_mapping = dict(zip(embarked_locs, \n",
|
1436 | 1436 | " range(0, len(embarked_locs) + 1)))\n",
|
|
1682 | 1682 | }
|
1683 | 1683 | ],
|
1684 | 1684 | "source": [
|
1685 |
| - "embarked_locs = sort(df_train['Embarked_Val'].unique())\n", |
| 1685 | + "embarked_locs = sorted(df_train['Embarked_Val'].unique())\n", |
1686 | 1686 | "embarked_locs"
|
1687 | 1687 | ]
|
1688 | 1688 | },
|
|
2393 | 2393 | ],
|
2394 | 2394 | "source": [
|
2395 | 2395 | "# Get the unique values of FamilySize and its maximum\n",
|
2396 |
| - "family_sizes = sort(df_train['FamilySize'].unique())\n", |
| 2396 | + "family_sizes = sorted(df_train['FamilySize'].unique())\n", |
2397 | 2397 | "family_size_max = max(family_sizes)\n",
|
2398 | 2398 | "\n",
|
2399 | 2399 | "df1 = df_train[df_train['Survived'] == 0]['FamilySize']\n",
|
|
2581 | 2581 | "def clean_data(df, drop_passenger_id):\n",
|
2582 | 2582 | " \n",
|
2583 | 2583 | " # Get the unique values of Sex\n",
|
2584 |
| - " sexes = sort(df['Sex'].unique())\n", |
| 2584 | + " sexes = sorted(df['Sex'].unique())\n", |
2585 | 2585 | " \n",
|
2586 | 2586 | " # Generate a mapping of Sex from a string to a number representation \n",
|
2587 | 2587 | " genders_mapping = dict(zip(sexes, range(0, len(sexes) + 1)))\n",
|
|
2590 | 2590 | " df['Sex_Val'] = df['Sex'].map(genders_mapping).astype(int)\n",
|
2591 | 2591 | " \n",
|
2592 | 2592 | " # Get the unique values of Embarked\n",
|
2593 |
| - " embarked_locs = sort(df['Embarked'].unique())\n", |
| 2593 | + " embarked_locs = sorted(df['Embarked'].unique())\n", |
2594 | 2594 | "\n",
|
2595 | 2595 | " # Generate a mapping of Embarked from a string to a number representation \n",
|
2596 | 2596 | " embarked_locs_mapping = dict(zip(embarked_locs, \n",
|
|
0 commit comments