import numpy as np

scalar = np.array(5)
type(scalar)

numpy.ndarray

vector = np.array([1, 2, 3])
vector

array([1, 2, 3])

matrix = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]])
matrix

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

# 배열의 차원 확인
print(scalar.ndim, vector.ndim, matrix.ndim)

0 1 2

# 배열의 모양 확인
print(scalar.shape, vector.shape, matrix.shape)

() (3,) (3, 3)

# 문자열로도 배열을 생성할 수 있음
str_vector = np.array(list('ABCD'))
str_vector

array(['A', 'B', 'C', 'D'], dtype='<U1')

# numpy 배열은 한 가지 데이터 타입만 가질 수 있으므로, 타입이 섞여 있으면 하나의 타입(여기서는 문자열)으로 통일됨
ls = [1, 2, 3, 'D']
np.array(ls)

array(['1', '2', '3', 'D'], dtype='<U21')

# .astype()으로 데이터 타입 변경
print(np.array([1, 2, 3, '4']).astype(np.float64))
print(np.array([1, 2, 3, '4']).astype(np.int64))

[1. 2. 3. 4.]
[1 2 3 4]

print(list(range(5)))
print(list(np.arange(5)))

[0, 1, 2, 3, 4]
[0, 1, 2, 3, 4]

print(list(np.arange(1, 5)))
print(list(np.arange(1, 5, 2)))  # stride = 2

[1, 2, 3, 4]
[1, 3]

mat_zero = np.zeros((2, 2, 3))
print(mat_zero)

[[[0. 0. 0.]
  [0. 0. 0.]]

 [[0. 0. 0.]
  [0. 0. 0.]]]

mat_ones = np.ones((2, 2, 3))
print(mat_ones)

[[[1. 1. 1.]
  [1. 1. 1.]]

 [[1. 1. 1.]
  [1. 1. 1.]]]

# 균일분포로부터 정수 난수를 생성
np.random.randint(10, size = (2, 3))  # 0~9

array([[7, 8, 9],
       [1, 0, 8]])

# seed
# seed 값을 고정하면 실행할 때마다 동일한 난수가 출력됨
np.random.seed(10)
np.random.randint(0, 10, size = 10)

array([9, 4, 0, 1, 9, 0, 1, 8, 9, 0])

np.random.choice(5, 10)  # 5가 end point (5 포함x)

array([3, 1, 3, 2, 1, 2, 0, 4, 2, 2])

# 0~4 숫자 중에서 선택
# 반환할 샘플의 개수: 10개
# p로 각 값의 선택 확률 지정 (확률의 합은 1이어야 함)
# 확률 배열은 선택할 수 있는 값의 배열과 길이가 동일해야 합니다.
np.random.choice(5, 10, p = [0.1, 0, 0.3, 0.6, 0])

array([2, 3, 3, 3, 3, 0, 3, 3, 2, 3])

np.linspace(start, stop, num = 50, endpoint = True)

np.linspace(10, 20, 11)

array([10., 11., 12., 13., 14., 15., 16., 17., 18., 19., 20.])

vec = np.random.randint(10, size =10)
print(vec)

[2 8 5 8 0 9 7 7 4 0]

# 처음부터 시작해서 3번째 값(인덱스 2)까지 선택해주세요
print(vec[:3])

[2 8 5]

# 역순에서 3번째 값부터 시작하고, 끝까지 선택해주세요
print(vec[-3:])

[7 4 0]

# 역순에서 4번째 값을 선택해주세요
print(vec[-4])

7

# 끝에서부터 처음까지 역순으로 2칸씩 건너뛰며 선택해주세요
print(vec[::-2])

[0 7 9 8 8]

mat = np.random.randint(5, size = (3, 3))
print(mat)

[[1 3 3]
 [0 2 0]
 [4 1 3]]

print(mat[0][1])
print(mat[0, 1])

3
3

# 1~25까지의 정수가 담긴 1차원 배열(벡터) 생성
vec = np.arange(1, 26)
print(vec)
print(len(vec))

[ 1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24
 25]
25

mat = vec.reshape(5, 5)
print(mat)

[[ 1  2  3  4  5]
 [ 6  7  8  9 10]
 [11 12 13 14 15]
 [16 17 18 19 20]
 [21 22 23 24 25]]

# 세번째 행 전체 선택
print(mat[2])
print(mat[2,:])

[11 12 13 14 15]
[11 12 13 14 15]

# 세번째 열 전체 선택
print(mat[:, 2])

[ 3  8 13 18 23]

# 두번째 행부터 세번째 행
# 두번째 열부터 세번째 열
print(mat[1:3, 1:3])

[[ 7  8]
 [12 13]]

# 행을 역순으로 변환
print(mat[::-1, :])

[[21 22 23 24 25]
 [16 17 18 19 20]
 [11 12 13 14 15]
 [ 6  7  8  9 10]
 [ 1  2  3  4  5]]

# 행렬 전체를 역순으로 변환
print(mat[::-1, ::-1])

[[25 24 23 22 21]
 [20 19 18 17 16]
 [15 14 13 12 11]
 [10  9  8  7  6]
 [ 5  4  3  2  1]]

np.reshape(a, newshape)

a = np.arange(9)
print(a)
print(len(a))
print(a.reshape(3, 3))

[0 1 2 3 4 5 6 7 8]
9
[[0 1 2]
 [3 4 5]
 [6 7 8]]

a_reshape = np.reshape(a, (3, 3))
print(a_reshape)

[[0 1 2]
 [3 4 5]
 [6 7 8]]

# 차원이 맞지 않으면 에러
b = np.arange(10)
b.reshape(3, 3)

---------------------------------------------------------------------------
ValueError                                Traceback (most recent call last)
Cell In[321], line 3
      1 # 차원이 맞지 않으면 에러
      2 b = np.arange(10)
----> 3 b.reshape(3, 3)

ValueError: cannot reshape array of size 10 into shape (3,3)

# -1: 행을 3개로 설정하는데, 열은 자동으로 설정
a = np.arange(9)
print(a)
print(a.reshape(3, -1))

[0 1 2 3 4 5 6 7 8]
[[0 1 2]
 [3 4 5]
 [6 7 8]]

image = np.random.randint(0, 256, size = (32, 32, 3), dtype = np.uint8)
print(image.shape)

(32, 32, 3)

# 이미지 시각화 예시
import matplotlib.pyplot as plt
image = np.random.randint(0, 256, size = (32, 32, 3), dtype = np.uint8)
plt.imshow(image)
plt.show()

# 이미지 데이터 reshape 예시
image.reshape(32*32, 3)

array([[247,  28, 165],
       [155,   9,  53],
       [ 58,   9, 126],
       ...,
       [ 67, 209,  70],
       [100, 195, 102],
       [ 31, 129, 155]], dtype=uint8)

np.where(condition, [x, y])

condition = [True, False, True]
x = [1, 2, 3]
y = [10, 20, 30]

np.where(condition, x, y)

array([ 1, 20,  3])

# np.where()를 반복문으로 구현
result = []
for con, x_value, y_value in zip(condition, x, y):
    if con:
        result.append(x_value)
    else:
        result.append(y_value)
print(result)

[1, 20, 3]

# list comprehension과 zip()을 사용한 구현
result = [xv if con else yv for con, xv, yv in zip(condition, x, y)]
print(result)

[1, 20, 3]

[Python] [Data Analysis] Pandas를 활용한 서울시 범죄 데이터 전처리 (1)	2023.08.08
[Python] [Data Analysis] Pandas DataFrame 가지고 놀기 (1)	2023.08.07
[Python] [Data Analysis] Pandas 기초 (3)	2023.08.04

Paul's Grit

Paul's Grit

[Python] [Data Analysis] Numpy 기초 본문

[Python] [Data Analysis] Numpy 기초

Numpy¶

선형대수¶

01. ndarray 객체 생성¶

02. np.arange()¶

03. np.zeros(), np.ones()¶

04. np.random 모듈¶

05. np.linspace()¶

06. ndarray 객체에서 데이터 선택¶

행렬에서 슬라이싱 (1)¶

행렬에서 슬라이싱 (2)¶

07. 행을 역순으로 변환¶

08. np.where()¶

'Data Analysis > Pandas' 카테고리의 다른 글

티스토리툴바

« 2025/07 »
일	월	화	수	목	금	토
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31