import pandas as pd
# With no data supplied, the constructor yields a frame with no rows and
# no columns.
df = pd.DataFrame(data=None)
df

# A flat list becomes a single column (labelled 0) with one row per element.
data = [1, 2, 3, 4, 5]
df = pd.DataFrame(data=data)
df

import pandas as pd
# Each inner list is one row; `columns` supplies the label for each position.
data = [
    ['Alex', 10],
    ['Bob', 12],
    ['Clarke', 13],
]
df = pd.DataFrame(data=data, columns=['Name', 'Age'])
df

# Build the frame from row lists, then cast the Age column to floating point
# so the integers are stored as 10.0 / 12.0 / 13.0.
data = [
    ['Alex', 10],
    ['Bob', 12],
    ['Clarke', 13],
]
df = pd.DataFrame(data=data, columns=['Name', 'Age'])
df = df.astype({'Age': float})

df

# Dict keys become the column labels and the equal-length lists become the
# column values; rows receive the default 0..n-1 index.
data = {
    'Name': ['Tom', 'Jack', 'Steve', 'Ricky'],
    'Age': [28, 34, 29, 42],
}
df = pd.DataFrame(data=data)
df

# Same dict-of-lists input, but with explicit row labels in place of the
# default integer index.
data = {
    'Name': ['Tom', 'Jack', 'Steve', 'Ricky'],
    'Age': [28, 34, 29, 42],
}
df = pd.DataFrame(
    data=data,
    index=['rank1', 'rank2', 'rank3', 'rank4'],
)
df

# Each dict is one row and the union of keys forms the columns. The first
# record has no 'c', so that cell is NaN.
data = [
    {'a': 1, 'b': 2},
    {'a': 5, 'b': 10, 'c': 20},
]
df = pd.DataFrame(data=data)
df

# List-of-dicts input again, this time labelling the two rows explicitly.
data = [
    {'a': 1, 'b': 2},
    {'a': 5, 'b': 10, 'c': 20},
]
df = pd.DataFrame(data=data, index=['first', 'second'])
df

data = [{'a': 1, 'b': 2}, {'a': 5, 'b': 10, 'c': 20}]

# Both requested columns are keys in the records, so they are filled from them.
df1 = pd.DataFrame(data, index=['first', 'second'], columns=['a', 'b'])

# 'b1' is not a key in any record, so that column comes out entirely NaN.
df2 = pd.DataFrame(data, index=['first', 'second'], columns=['a', 'b1'])

print(df1)
# Output:
#         a   b
# first   1   2
# second  5  10

print(df2)
# Output:
#         a  b1
# first   1 NaN
# second  5 NaN

# Columns come from the dict keys and the row index is the union of the
# Series indexes. 'one' has no entry for label 'd', so that cell is NaN.
d = {
    'one': pd.Series(data=[1, 2, 3], index=list('abc')),
    'two': pd.Series(data=[1, 2, 3, 4], index=list('abcd')),
}
df = pd.DataFrame(data=d)
df

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd'])}
df = pd.DataFrame(d)

# Indexing with a column label returns that column as a Series.
df['one']
# Output:
# a    1.0
# b    2.0
# c    3.0
# d    NaN
# Name: one, dtype: float64

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd'])}
df = pd.DataFrame(d)

print("Adding a new column by passing as Series:")
# Output:
# Adding a new column by passing as Series:

# The assigned Series is aligned on index labels; it has no 'd' entry, so
# row 'd' gets NaN in the new column.
df['three'] = pd.Series([10, 20, 30], index=['a', 'b', 'c'])
print(df)
# Output:
#    one  two  three
# a  1.0    1   10.0
# b  2.0    2   20.0
# c  3.0    3   30.0
# d  NaN    4    NaN

print("Adding a new column using the existing columns in DataFrame:")
# Output:
# Adding a new column using the existing columns in DataFrame:

# Element-wise sum of two existing columns; NaN in either operand gives NaN.
df['four'] = df['one'] + df['three']

print(df)
# Output:
#    one  two  three  four
# a  1.0    1   10.0  11.0
# b  2.0    2   20.0  22.0
# c  3.0    3   30.0  33.0
# d  NaN    4    NaN   NaN

# Build a three-column DataFrame, then delete columns from it in two
# different ways: the `del` statement and the `pop` method.
import pandas as pd

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd']),
     'three': pd.Series([10, 20, 30], index=['a', 'b', 'c'])}

df = pd.DataFrame(d)
print("Our dataframe is:")
# Output:
# Our dataframe is:

print(df)
# Output:
#    one  two  three
# a  1.0    1   10.0
# b  2.0    2   20.0
# c  3.0    3   30.0
# d  NaN    4    NaN

# using del function
print("Deleting the first column using DEL function:")
# Output:
# Deleting the first column using DEL function:

del df['one']
print(df)
# Output:
#    two  three
# a    1   10.0
# b    2   20.0
# c    3   30.0
# d    4    NaN

# using pop function
print("Deleting another column using POP function:")
# Output:
# Deleting another column using POP function:

# pop removes the column from df; the removed column it returns is not
# needed here, so the return value is discarded.
df.pop('two')
print(df)
# Output:
#    three
# a   10.0
# b   20.0
# c   30.0
# d    NaN

import pandas as pd

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd'])}

df = pd.DataFrame(d)

# .loc selects by row label; the result is a Series whose index is the
# column labels and whose name is the row label.
print(df.loc['b'])
# Output:
# one    2.0
# two    2.0
# Name: b, dtype: float64

import pandas as pd

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd'])}

df = pd.DataFrame(d)

# .iloc selects by integer position; position 2 is the row labelled 'c'.
print(df.iloc[2])
# Output:
# one    3.0
# two    3.0
# Name: c, dtype: float64

import pandas as pd

d = {'one': pd.Series([1, 2, 3], index=['a', 'b', 'c']),
     'two': pd.Series([1, 2, 3, 4], index=['a', 'b', 'c', 'd'])}

df = pd.DataFrame(d)

# An integer slice inside [] selects rows by position (end exclusive), so
# this yields the rows at positions 2 and 3.
print(df[2:4])
# Output:
#    one  two
# c  3.0    3
# d  NaN    4

import pandas as pd

df = pd.DataFrame([[1, 2], [3, 4]], columns=['a', 'b'])
df2 = pd.DataFrame([[5, 6], [7, 8]], columns=['a', 'b'])

# Stack df2's rows under df's. ignore_index=True discards both original
# indexes and renumbers the result 0..n-1.
df = pd.concat([df, df2], ignore_index=True)

print(df)
# Output:
#    a  b
# 0  1  2
# 1  3  4
# 2  5  6
# 3  7  8

import pandas as pd

df = pd.DataFrame([[1, 2], [3, 4]], columns=['a', 'b'])
df2 = pd.DataFrame([[5, 6], [7, 8]], columns=['a', 'b'])

df = pd.concat([df, df2], ignore_index=True)

# Drop rows with label 0. drop returns a new frame, so the result is
# rebound to df; the remaining rows keep their labels 1..3.
df = df.drop(0)

print(df)
# Output:
#    a  b
# 1  3  4
# 2  5  6
# 3  7  8

创建数据帧

从列表创建DataFrame

从 `ndarrays` / `Lists` 的字典来创建DataFrame

从字典列表创建DataFrame

从系列的字典来创建DataFrame

列选择

列添加

列删除

行的选择、添加和删除

标签选择

行切片

附加行

删除行

① 阅读使用手册

② 注册用户账号

介绍

平台内核

注意事项

	Name	Age
0	Alex	10
1	Bob	12
2	Clarke	13

	Name	Age
0	Alex	10.0
1	Bob	12.0
2	Clarke	13.0

	Name	Age
0	Tom	28
1	Jack	34
2	Steve	29
3	Ricky	42

	Name	Age
rank1	Tom	28
rank2	Jack	34
rank3	Steve	29
rank4	Ricky	42

创建数据帧

从列表创建DataFrame

从 ndarrays / Lists 的字典来创建DataFrame

从字典列表创建DataFrame

从系列的字典来创建DataFrame

列选择

列添加

列删除

行的选择、添加和删除

标签选择

行切片

附加行

删除行

① 阅读使用手册

② 注册用户账号

③ 登录

Python基础

Python进阶

标准类库

专题工具

图像处理

科学计算

自然语言

开源GIS

R 编程语言

Julia编程语言

介绍

平台内核

注意事项

从 `ndarrays` / `Lists` 的字典来创建DataFrame