Vitaliy_Novichikhin

спринт 5 4.7 Переименование столбцов верное решение

Apr 8th, 2022 (edited)
716
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 1.05 KB | None | 0 0
  1. import pandas as pd
  2.  
  3. data = pd.read_csv('/datasets/visits.csv', sep='\t')
  4.  
  5. # фильтруем слишком быстрые и медленные заезды и АЗС
  6. data['too_fast'] = data['time_spent'] < 60
  7. data['too_slow'] = data['time_spent'] > 1000
  8. too_fast_stat = data.pivot_table(index='id', values='too_fast')
  9. good_ids = too_fast_stat.query('too_fast < 0.5')
  10. good_data = data.query('id in @good_ids.index and 60 <= time_spent <= 1000')
  11.  
  12. # считаем данные по отдельным АЗС и по сетям
  13. station_stat = data.pivot_table(index='id', values='time_spent', aggfunc='median')
  14. good_stations_stat = good_data.pivot_table(index='id', values='time_spent', aggfunc='median')
  15.  
  16. stat = data.pivot_table(index='name', values='time_spent')
  17. good_stat = good_data.pivot_table(index='name', values='time_spent', aggfunc='median')
  18. stat['good_time_spent'] = good_stat['time_spent']
  19.  
  20. id_name = good_data.pivot_table(index='id', values='name', aggfunc=['first', 'count'])
  21.  
  22. id_name.columns = ['name', 'count']
  23.  
  24. print(id_name.head())
Add Comment
Please, Sign In to add comment