Pandas数据分析

from datetime import timedelta
from pandas import DataFrame
from scipy import stats
import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import seaborn as sns

# Location of the raw CSV export
path = 'links_date.csv'

# Load the raw data, indexed by 'tmdbId', with the 'start' and 'end'
# columns parsed as datetimes
parse_dates = ['start', 'end']
df = pd.read_csv(path, parse_dates=parse_dates, index_col='tmdbId')

# Discard every row that contains a missing value.
# (Alternative shown by the author: fill the gaps instead of dropping,
#  i.e. df.fillna(0, inplace=True).)
df = df.dropna()

# Keep only the rows whose start-to-end span is exactly one hour.
# A temporary 'DELTATIME' column carries the span through the filter
# and is removed again once the selection is done.
df = (
    df.assign(DELTATIME=df['end'] - df['start'])
      .loc[lambda frame: frame['DELTATIME'] == timedelta(hours=1)]
      .drop('DELTATIME', axis=1)
)

# Handle data

 

posted on 2017-08-07 23:44  Apple@Jing  阅读(251)  评论(0)  编辑  收藏  举报

导航