Pandas Basics
Essential Pandas operations for DataFrames, data manipulation, and analysis.
Import & DataFrames
import pandas as pd
# Create DataFrame from dictionary
df = pd.DataFrame({
'name': ['Alice', 'Bob'],
'age': [25, 30]
})
# Read from CSV file
df = pd.read_csv('data.csv') # load CSV file
df = pd.read_excel('data.xlsx') # load Excel file
Viewing Data
df.head(5) # first 5 rows
df.tail(3) # last 3 rows
df.info() # data types and non-null counts
df.describe() # statistical summary
df.shape # (rows, columns)
df.columns # column names
Selecting Data
# Select single column
df['name'] # returns Series
df[['name', 'age']] # multiple columns, returns DataFrame
# Select rows
df.loc[0] # by label/index
df.iloc[0] # by integer position
df.loc[0:2] # slice by label
# Filter rows
df[df['age'] > 25] # filter by condition
Modify Data
# Add column
df['new_col'] = 0 # add with constant value
df['total'] = df['a'] + df['b'] # calculated column
# Drop column
df.drop('name', axis=1) # axis=1 for columns
df.drop(['a', 'b'], axis=1) # drop multiple
# Sort
df.sort_values('age') # ascending
df.sort_values('age', ascending=False) # descending
# Group by
df.groupby('name').mean() # average by group