Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
def drop_dublicate(data):
    """Print *data* with a duplicate-row flag and return it de-duplicated.

    Two rows count as duplicates when they agree on every key column
    (``ogrn``, ``press_release_link``, ``company_link``, ``_date``,
    ``rating``, ``fin_instrument``); other columns are ignored. The first
    occurrence of each key combination is kept.

    Args:
        data: pandas DataFrame that contains all of the key columns.

    Returns:
        A new DataFrame holding only the rows that are not flagged as
        duplicates, with their original index labels. *data* itself is
        not modified.

    Raises:
        KeyError: if any of the key columns is missing from *data*.
    """
    key_columns = [
        'ogrn',
        'press_release_link',
        'company_link',
        '_date',
        'rating',
        'fin_instrument',
    ]
    # Boolean mask: True for every repeat of an already-seen key combination.
    is_duplicate = data.duplicated(subset=key_columns)

    # Diagnostic dump: the input frame with the mask appended as an extra
    # column, so flagged rows can be inspected by eye.
    temp_df = pd.concat([data, is_duplicate], axis=1)
    print(temp_df)

    # Hand the cleaned frame back to the caller instead of discarding it.
    return data.loc[~is_duplicate]
if __name__ == '__main__':
    import sys

    # The workbook path used to be a hard-coded empty string, which made
    # pd.read_excel fail on every run; take it from the command line instead.
    if len(sys.argv) != 2:
        sys.exit(f'usage: {sys.argv[0]} WORKBOOK.xlsx')

    # NOTE: the earlier check_regions(data) pass is already done; per the
    # original TODO its new version lives in last_output.xlsx.
    data = pd.read_excel(sys.argv[1])
    drop_dublicate(data)
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement