patrickramos committed on
Commit
1c13beb
·
1 Parent(s): 85abf34

Update list of manual names

Browse files
Files changed (1) hide show
  1. data.py +5 -3
data.py CHANGED
@@ -295,7 +295,7 @@ translated_df = (
295
  .otherwise(pl.col('name_en'))
296
  .alias('name_en')
297
  )
298
- .with_columns(pl.col('name_en').str.replace_all(',', '').str.to_titlecase())
299
  )
300
 
301
  # handle inconsistent kanji between sources
@@ -330,9 +330,11 @@ players_df = (
330
  )
331
  )
332
  print(players_df.filter(pl.len().over('playerId', 'team', 'season') > 1))
333
- players_df = pl.concat((players_df.group_by('playerId').agg(pl.first('name_en')), manual_translated_df[['playerId', 'name_en']])).unique()
 
 
 
334
  print(players_df.filter(pl.len().over('playerId') > 1).sort('playerId'))
335
- players_df = players_df.group_by('playerId').agg(pl.first('name_en'))
336
 
337
  # join players to data
338
  data_df = (
 
295
  .otherwise(pl.col('name_en'))
296
  .alias('name_en')
297
  )
298
+ .with_columns(pl.when(pl.col('name_en') == pl.col('name_en').str.to_uppercase()).then(pl.col('name_en').str.to_titlecase()).otherwise('name_en').str.replace_all(',', ''))
299
  )
300
 
301
  # handle inconsistent kanji between sources
 
330
  )
331
  )
332
  print(players_df.filter(pl.len().over('playerId', 'team', 'season') > 1))
333
+ players_df = pl.concat((
334
+ players_df.group_by('playerId').agg(pl.first('name_en')),
335
+ manual_translated_df[['playerId', 'name_en']]
336
+ )).unique()
337
  print(players_df.filter(pl.len().over('playerId') > 1).sort('playerId'))
 
338
 
339
  # join players to data
340
  data_df = (