python_pandas_9 - 8BitsCoding/RobotMentor GitHub Wiki

import pandas as pd

# Sample roster: the last record repeats the first one exactly, so the
# frame contains one fully duplicated row.
student_list = [
    dict(name='John', major='Computer Science', sex='male'),
    dict(name='Nate', major='Computer Science', sex='male'),
    dict(name='Edward', major='Computer Science', sex='male'),
    dict(name='Zara', major='Psychology', sex='female'),
    dict(name='John', major='Computer Science', sex='male'),
]

# Build the frame with an explicit column order.
df = pd.DataFrame(data=student_list, columns=['name', 'major', 'sex'])

# Boolean Series: True for each row that repeats an earlier row.
df.duplicated()

어디서 중복된 값이 존재하는지 표시

# Return a copy with fully duplicated rows removed; the first occurrence
# of each row is kept (these are the pandas defaults, spelled out).
df.drop_duplicates(subset=None, keep='first')

중복된 데이터는 제거

# Flag rows whose 'name' value already appeared in an earlier row,
# ignoring the other columns.
df.duplicated(subset=['name'])

name열에 중복이 있을 경우 표시

# Drop rows whose 'name' repeats an earlier row, keeping the first
# occurrence. Pass keep='last' instead to keep the final occurrence.
# (The original inline "#'last')" commented out the closing parenthesis,
# which made this statement a syntax error.)
df.drop_duplicates(['name'], keep='first')

name열에 중복이 있을 경우 제거