数据提取
import pandas as pd
import requests
from sqlalchemy import create_engine

# Extract from the database: load every row of the `users` table from the
# local SQLite file into a DataFrame.
engine = create_engine('sqlite:///data.db')
df = pd.read_sql('SELECT * FROM users', engine)

# Extract from the API. An explicit timeout keeps the script from hanging
# forever on an unresponsive server, and raise_for_status() surfaces HTTP
# errors instead of trying to parse an error page as JSON.
response = requests.get('https://api.example.com/data', timeout=10)
response.raise_for_status()
data = response.json()
数据转换
# Data cleaning.
# NOTE(review): relies on `df` and `pd` from the extraction step above, and
# assumes `df` has 'date' and 'amount' columns -- confirm against the schema.
df = df.dropna()  # drop rows that contain any missing value
df = df.drop_duplicates()  # drop fully duplicated rows

# Data type conversion.
df['date'] = pd.to_datetime(df['date'])
df['amount'] = pd.to_numeric(df['amount'])
转载请注明:周志洋的博客 » Python数据分析-ETL数据处理