Spaces:
Running
Running
Commit
·
1c13beb
1
Parent(s):
85abf34
Update list of manual names
Browse files
data.py
CHANGED
|
@@ -295,7 +295,7 @@ translated_df = (
|
|
| 295 |
.otherwise(pl.col('name_en'))
|
| 296 |
.alias('name_en')
|
| 297 |
)
|
| 298 |
-
.with_columns(pl.col('name_en').str.
|
| 299 |
)
|
| 300 |
|
| 301 |
# handle inconsistent kanji between sources
|
|
@@ -330,9 +330,11 @@ players_df = (
|
|
| 330 |
)
|
| 331 |
)
|
| 332 |
print(players_df.filter(pl.len().over('playerId', 'team', 'season') > 1))
|
| 333 |
-
players_df = pl.concat((
|
|
|
|
|
|
|
|
|
|
| 334 |
print(players_df.filter(pl.len().over('playerId') > 1).sort('playerId'))
|
| 335 |
-
players_df = players_df.group_by('playerId').agg(pl.first('name_en'))
|
| 336 |
|
| 337 |
# join players to data
|
| 338 |
data_df = (
|
|
|
|
| 295 |
.otherwise(pl.col('name_en'))
|
| 296 |
.alias('name_en')
|
| 297 |
)
|
| 298 |
+
.with_columns(pl.when(pl.col('name_en') == pl.col('name_en').str.to_uppercase()).then(pl.col('name_en').str.to_titlecase()).otherwise('name_en').str.replace_all(',', ''))
|
| 299 |
)
|
| 300 |
|
| 301 |
# handle inconsistent kanji between sources
|
|
|
|
| 330 |
)
|
| 331 |
)
|
| 332 |
print(players_df.filter(pl.len().over('playerId', 'team', 'season') > 1))
|
| 333 |
+
players_df = pl.concat((
|
| 334 |
+
players_df.group_by('playerId').agg(pl.first('name_en')),
|
| 335 |
+
manual_translated_df[['playerId', 'name_en']]
|
| 336 |
+
)).unique()
|
| 337 |
print(players_df.filter(pl.len().over('playerId') > 1).sort('playerId'))
|
|
|
|
| 338 |
|
| 339 |
# join players to data
|
| 340 |
data_df = (
|