1.初识数组对象

import numpy as np
np.__version__

'1.14.0'

data = np.array([1,2,3,4,5])
data

array([1, 2, 3, 4, 5])

type(data)

numpy.ndarray

dir(data)

['T',
 '__abs__',
 '__add__',
 '__and__',
 '__array__',
 '__array_finalize__',
 '__array_interface__',
 '__array_prepare__',
 '__array_priority__',
 '__array_struct__',
 '__array_ufunc__',
 '__array_wrap__',
 '__bool__',
 '__class__',
 '__complex__',
 '__contains__',
 '__copy__',
 '__deepcopy__',
 '__delattr__',
 '__delitem__',
 '__dir__',
 '__divmod__',
 '__doc__',
 '__eq__',
 '__float__',
 '__floordiv__',
 '__format__',
 '__ge__',
 '__getattribute__',
 '__getitem__',
 '__gt__',
 '__hash__',
 '__iadd__',
 '__iand__',
 '__ifloordiv__',
 '__ilshift__',
 '__imatmul__',
 '__imod__',
 '__imul__',
 '__index__',
 '__init__',
 '__init_subclass__',
 '__int__',
 '__invert__',
 '__ior__',
 '__ipow__',
 '__irshift__',
 '__isub__',
 '__iter__',
 '__itruediv__',
 '__ixor__',
 '__le__',
 '__len__',
 '__lshift__',
 '__lt__',
 '__matmul__',
 '__mod__',
 '__mul__',
 '__ne__',
 '__neg__',
 '__new__',
 '__or__',
 '__pos__',
 '__pow__',
 '__radd__',
 '__rand__',
 '__rdivmod__',
 '__reduce__',
 '__reduce_ex__',
 '__repr__',
 '__rfloordiv__',
 '__rlshift__',
 '__rmatmul__',
 '__rmod__',
 '__rmul__',
 '__ror__',
 '__rpow__',
 '__rrshift__',
 '__rshift__',
 '__rsub__',
 '__rtruediv__',
 '__rxor__',
 '__setattr__',
 '__setitem__',
 '__setstate__',
 '__sizeof__',
 '__str__',
 '__sub__',
 '__subclasshook__',
 '__truediv__',
 '__xor__',
 'all',
 'any',
 'argmax',
 'argmin',
 'argpartition',
 'argsort',
 'astype',
 'base',
 'byteswap',
 'choose',
 'clip',
 'compress',
 'conj',
 'conjugate',
 'copy',
 'ctypes',
 'cumprod',
 'cumsum',
 'data',
 'diagonal',
 'dot',
 'dtype',
 'dump',
 'dumps',
 'fill',
 'flags',
 'flat',
 'flatten',
 'getfield',
 'imag',
 'item',
 'itemset',
 'itemsize',
 'max',
 'mean',
 'min',
 'nbytes',
 'ndim',
 'newbyteorder',
 'nonzero',
 'partition',
 'prod',
 'ptp',
 'put',
 'ravel',
 'real',
 'repeat',
 'reshape',
 'resize',
 'round',
 'searchsorted',
 'setfield',
 'setflags',
 'shape',
 'size',
 'sort',
 'squeeze',
 'std',
 'strides',
 'sum',
 'swapaxes',
 'take',
 'tobytes',
 'tofile',
 'tolist',
 'tostring',
 'trace',
 'transpose',
 'var',
 'view']

data?

# 数组元素的类型
data.dtype

dtype('int64')

# Convert the elements to another type. astype returns a converted array and
# leaves `data` itself unchanged. The builtin `float` is used because the
# `np.float` alias was removed from NumPy.
new_data = data.astype(float)
new_data

array([1., 2., 3., 4., 5.])

new_data.dtype

dtype('float64')

data,data.dtype

(array([1, 2, 3, 4, 5]), dtype('int64'))

# 数组的外貌
a = np.array([1,2,3])
b = np.array([1.0,2.0,3.0])
a.dtype,b.dtype

(dtype('int64'), dtype('float64'))

a.shape

(3,)

b.shape

(3,)

c = np.array([1.0,2.0,3.0,4.0])
c.shape

(4,)

# 维度
a.ndim

1

# 返回元素个数
a.size

3

c.size

4

常用属性

dtype:返回数组元素的类型
shape:返回一个元组，元组中的每个整数依次对应数组的每个轴的元素个数
size:返回数组中元素个数
ndim:返回数组维度
nbytes:返回保存数据的字节数

2.创建数组

np.array?

a = np.array([1,2,3,4])
b = np.array([1,2,3,4],dtype=float)

a

array([1, 2, 3, 4])

a.dtype

dtype('int64')

a.shape

(4,)

a.size

4

a.ndim

1

b

array([1., 2., 3., 4.])

b.dtype

dtype('float64')

# 多维数组,数组的元素类型必须一致
da = np.array([[1,2,3,4],[5,6,7,8],[9,10,11,12]])
da

array([[ 1,  2,  3,  4],
       [ 5,  6,  7,  8],
       [ 9, 10, 11, 12]])

# Rows of unequal length cannot form a rectangular array. Ask for an object
# array explicitly so that each row is stored as a Python list; recent NumPy
# versions raise ValueError when dtype=object is omitted here.
np.array([[1, 2, 3], [4, 5, 6, 7], [8, 9]], dtype=object)

array([list([1, 2, 3]), list([4, 5, 6, 7]), list([8, 9])], dtype=object)

da.shape

(3, 4)

da.size

12

db = np.array([[1,2,3,4,5,6,7]],ndmin=2)
db

array([[1, 2, 3, 4, 5, 6, 7]])

db.shape

(1, 7)

db.ndim

2

dc = np.array([1,2,3,4,5,6,7])
dc

array([1, 2, 3, 4, 5, 6, 7])

dc.shape

(7,)

dc.ndim

1

a

array([1, 2, 3, 4])

de = np.array(a,dtype=complex)
de

array([1.+0.j, 2.+0.j, 3.+0.j, 4.+0.j])

de.dtype

dtype('complex128')

# 用函数创建数组
np.zeros((2,10))

array([[0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]])

np.zeros?

# zeros(shape, dtype=float, order='C')

同一种元素的数组

np.ones((6,))

array([1., 1., 1., 1., 1., 1.])

# 一维数组才能这样写
np.ones(6)

array([1., 1., 1., 1., 1., 1.])

da

array([[ 1,  2,  3,  4],
       [ 5,  6,  7,  8],
       [ 9, 10, 11, 12]])

da.shape

(3, 4)

np.ones(da.shape)

array([[1., 1., 1., 1.],
       [1., 1., 1., 1.],
       [1., 1., 1., 1.]])

np.ones_like(da)

array([[1, 1, 1, 1],
       [1, 1, 1, 1],
       [1, 1, 1, 1]])

# Same shape as `da`, but with the element type overridden to float.
# The builtin `float` replaces the removed `np.float` alias.
np.ones_like(da, dtype=float)

array([[1., 1., 1., 1.],
       [1., 1., 1., 1.],
       [1., 1., 1., 1.]])

df = 6.4 * np.ones_like(da)
df

array([[6.4, 6.4, 6.4, 6.4],
       [6.4, 6.4, 6.4, 6.4],
       [6.4, 6.4, 6.4, 6.4]])

对角线独特的数组

np.eye(),np.identity(),np.diag()都能创建对角线元素比较特殊而其他部分的元素为0的数组

np.eye(4,dtype=int)

array([[1, 0, 0, 0],
       [0, 1, 0, 0],
       [0, 0, 1, 0],
       [0, 0, 0, 1]])

np.eye(4,dtype=int,k=1)

array([[0, 1, 0, 0],
       [0, 0, 1, 0],
       [0, 0, 0, 1],
       [0, 0, 0, 0]])

np.eye(4,dtype=int,k=-1)

array([[0, 0, 0, 0],
       [1, 0, 0, 0],
       [0, 1, 0, 0],
       [0, 0, 1, 0]])

np.identity(4)

array([[1., 0., 0., 0.],
       [0., 1., 0., 0.],
       [0., 0., 1., 0.],
       [0., 0., 0., 1.]])

np.diag([1,2,3,4])

array([[1, 0, 0, 0],
       [0, 2, 0, 0],
       [0, 0, 3, 0],
       [0, 0, 0, 4]])

np.diag([1,2,3,4],k=1)

array([[0, 1, 0, 0, 0],
       [0, 0, 2, 0, 0],
       [0, 0, 0, 3, 0],
       [0, 0, 0, 0, 4],
       [0, 0, 0, 0, 0]])

de = np.arange(16).reshape((4,4))
de

array([[ 0,  1,  2,  3],
       [ 4,  5,  6,  7],
       [ 8,  9, 10, 11],
       [12, 13, 14, 15]])

np.diag(de)

array([ 0,  5, 10, 15])

np.diag(de,k=-1)

array([ 4,  9, 14])

元素是等差和等比的数组

# arange([start,] stop[, step,], dtype=None)
np.arange(1,100,3)

array([ 1,  4,  7, 10, 13, 16, 19, 22, 25, 28, 31, 34, 37, 40, 43, 46, 49,
       52, 55, 58, 61, 64, 67, 70, 73, 76, 79, 82, 85, 88, 91, 94, 97])

np.arange?

# np.linspace(start, stop, num=50, endpoint=True, retstep=False, dtype=None)
np.linspace(1,10,4)

array([ 1.,  4.,  7., 10.])

np.linspace?

np.logspace?

# np.logspace(start, stop, num=50, endpoint=True, base=10.0, dtype=None)
np.logspace(2,3,num=4)

array([ 100.        ,  215.443469  ,  464.15888336, 1000.        ])

import math
math.log10(215.443469)

2.333333333326906

math.log10(464.15888336)

2.666666666665471

创建自定义类型的数组

# Structured dtype: every record has a 40-byte string field `book` and a
# default-integer field `version`. The builtin `int` replaces the removed
# `np.int` alias.
my_type = np.dtype({"names": ["book", "version"], "formats": ["S40", int]})
my_type

dtype([('book', 'S40'), ('version', '<i8')])

my_books = np.array([("python",2),("java",1)],dtype=my_type)
my_books

array([(b'python', 2), (b'java', 1)],
      dtype=[('book', 'S40'), ('version', '<i8')])

# 同my_type
my_type2 = np.dtype([('book','S40'),('version','<i8')])

my_books['book']

array([b'python', b'java'], dtype='|S40')

my_books['book'][0]

b'python'

my_books[0]

(b'python', 2)

my_books[0]['book']

b'python'

# 修改记录
my_books[0]['book'] = "learn python"
my_books

array([(b'learn python', 2), (b'java', 1)],
      dtype=[('book', 'S40'), ('version', '<i8')])

数组一旦确定，其轴的数量就不能变化

用from系列函数创建数组

# View the bytes as 1-byte strings: skip the first 6 bytes ("hello ") via
# offset, then read 5 items ("world") via count.
np.frombuffer(b'hello world',dtype='S1',count=5,offset=6)

array([b'w', b'o', b'r', b'l', b'd'], dtype='|S1')

np.frombuffer?

def foo(x):
    """Return ``x + 1``; also works elementwise when ``x`` is an array."""
    return x + 1
# Build a length-5 array by applying foo to the integer indices 0..4.
# The builtin `int` replaces the removed `np.int` alias.
np.fromfunction(foo, (5,), dtype=int)

array([1, 2, 3, 4, 5])

# 9x9 multiplication table: entry (i, j) holds (i + 1) * (j + 1).
# The builtin `int` replaces the removed `np.int` alias.
np.fromfunction(lambda i, j: (i + 1) * (j + 1), (9, 9), dtype=int)

array([[ 1,  2,  3,  4,  5,  6,  7,  8,  9],
       [ 2,  4,  6,  8, 10, 12, 14, 16, 18],
       [ 3,  6,  9, 12, 15, 18, 21, 24, 27],
       [ 4,  8, 12, 16, 20, 24, 28, 32, 36],
       [ 5, 10, 15, 20, 25, 30, 35, 40, 45],
       [ 6, 12, 18, 24, 30, 36, 42, 48, 54],
       [ 7, 14, 21, 28, 35, 42, 49, 56, 63],
       [ 8, 16, 24, 32, 40, 48, 56, 64, 72],
       [ 9, 18, 27, 36, 45, 54, 63, 72, 81]])

Python数据分析学习（二）：Numpy数组对象基础

1.初识数组对象¶

常用属性¶

2.创建数组¶