import tensorflow as tf


# Build a 2x2 constant tensor from a nested Python list of floats.
x = tf.constant([[1., 2.], [3., 4.]])
print(x)

tf.Tensor(
[[1. 2.]
 [3. 4.]], shape=(2, 2), dtype=float32)


# Tensor of shape (2, 1) with every entry set to one.
x = tf.ones(shape=(2, 1))
print(x)

tf.Tensor(
[[1.]
 [1.]], shape=(2, 1), dtype=float32)


# Tensor of shape (2, 1) with every entry set to zero.
x = tf.zeros(shape=(2, 1))
print(x)

tf.Tensor(
[[0.]
 [0.]], shape=(2, 1), dtype=float32)


# Random (3, 1) tensor drawn from a normal distribution with mean 0 and
# standard deviation 1; values differ on every run.
x = tf.random.normal(shape=(3, 1), mean=0., stddev=1.)
print(x)

tf.Tensor(
[[0.4956642 ]
 [0.7919767 ]
 [0.67300016]], shape=(3, 1), dtype=float32)


# Random (3, 1) tensor drawn from a uniform distribution bounded by
# minval=0 and maxval=1; values differ on every run.
x = tf.random.uniform(shape=(3, 1), minval=0., maxval=1.)
print(x)

tf.Tensor(
[[0.2889459 ]
 [0.7924731 ]
 [0.12908947]], shape=(3, 1), dtype=float32)


# Indexing a tensor yields another tensor (here a scalar with shape ()).
x[0, 0]

<tf.Tensor: shape=(), dtype=float32, numpy=0.2889459>


# Show the concrete class of the indexed element.
type(x[0, 0])

tensorflow.python.framework.ops.EagerTensor


import numpy as np

# NumPy arrays support in-place item assignment: start from a 2x2 array of
# ones and overwrite the top-left entry.
x = np.ones((2, 2), dtype=float)
x[0][0] = 0.0

print(x)

[[0. 1.]
 [1. 1.]]


# Wrap a random (3, 1) tensor in a tf.Variable; the cells below update it in place.
v = tf.Variable(initial_value=tf.random.normal(shape=(3, 1)))
print(v)

<tf.Variable 'Variable:0' shape=(3, 1) dtype=float32, numpy=
array([[ 0.79358006],
       [ 2.0038128 ],
       [-1.7179965 ]], dtype=float32)>


# Replace the variable's entire value with a (3, 1) tensor of ones.
v.assign(tf.ones((3, 1)))

<tf.Variable 'UnreadVariable' shape=(3, 1) dtype=float32, numpy=
array([[1.],
       [1.],
       [1.]], dtype=float32)>


# Reading one entry of the variable gives a scalar tensor.
v[0, 0]

<tf.Tensor: shape=(), dtype=float32, numpy=1.0>


# Show the concrete class of the indexed entry.
type(v[0, 0])

tensorflow.python.framework.ops.EagerTensor


# Assign through the index expression to update only entry [0, 0] of the variable.
v[0, 0].assign(3.)

<tf.Variable 'UnreadVariable' shape=(3, 1) dtype=float32, numpy=
array([[3.],
       [1.],
       [1.]], dtype=float32)>


# In-place addition: add a tensor of ones to the variable's current value.
v.assign_add(tf.ones((3, 1)))

<tf.Variable 'UnreadVariable' shape=(3, 1) dtype=float32, numpy=
array([[4.],
       [2.],
       [2.]], dtype=float32)>


import numpy as np

# 2x2 float32 NumPy array used as the starting point for the tensor-op demos.
a = np.array([[2., 1.],
              [3., -2.]], dtype=np.float32)


# Convert the NumPy array to a tensor, then add a 2x2 tensor of ones;
# `a` is rebound to each result.
a = tf.convert_to_tensor(a)
a += tf.ones((2, 2))
print(a)

tf.Tensor(
[[ 3.  2.]
 [ 4. -1.]], shape=(2, 2), dtype=float32)


# Element-wise square of `a`.
b = tf.square(a)
print(b)

tf.Tensor(
[[ 9.  4.]
 [16.  1.]], shape=(2, 2), dtype=float32)


# Element-wise square root; `a` still holds a negative entry (-1) here,
# which comes out as nan.
c = tf.sqrt(a)
print(c)

tf.Tensor(
[[1.7320508 1.4142135]
 [2.              nan]], shape=(2, 2), dtype=float32)


# Apply ReLU and rebind `a`: the negative entry becomes 0, the rest are unchanged.
a = tf.nn.relu(a)
print(a)

tf.Tensor(
[[3. 2.]
 [4. 0.]], shape=(2, 2), dtype=float32)


# Square root again, now that `a` has no negative entries, so no nan appears.
c = tf.sqrt(a)
print(c)

tf.Tensor(
[[1.7320508 1.4142135]
 [2.        0.       ]], shape=(2, 2), dtype=float32)


# Element-wise sum of the two 2x2 tensors.
d = b + c
print(d)

tf.Tensor(
[[10.732051   5.4142137]
 [18.         1.       ]], shape=(2, 2), dtype=float32)


# Matrix product of `a` and `b` (row-by-column, not element-wise).
e = tf.matmul(a, b)
print(e)

tf.Tensor(
[[59. 14.]
 [36. 16.]], shape=(2, 2), dtype=float32)


# Element-wise multiplication of `e` by `a`, rebinding `e` to the result.
e *= a
print(e)

tf.Tensor(
[[177.  28.]
 [144.   0.]], shape=(2, 2), dtype=float32)


# Scalar variable at which the derivative is evaluated.
input_var = tf.Variable(initial_value=3.)

# Operations executed inside the tape context are recorded for differentiation.
with tf.GradientTape() as tape:
    result = tf.square(input_var)

# d(x^2)/dx evaluated at x = 3, i.e. 2 * 3 = 6.
gradient = tape.gradient(result, input_var)

print(gradient)

tf.Tensor(6.0, shape=(), dtype=float32)


# Same derivative as the tf.Variable example, but with a constant tensor as input.
input_const = tf.constant(3.)

with tf.GradientTape() as tape:
    # The constant is registered with the tape explicitly; the tf.Variable
    # example earlier in the file made no such call.
    tape.watch(input_const)
    result = tf.square(input_const)

# d(x^2)/dx evaluated at x = 3, i.e. 6.
gradient = tape.gradient(result, input_const)

print(gradient)

tf.Tensor(6.0, shape=(), dtype=float32)


num_samples_per_class = 1000

# Negative class: 2-D Gaussian cloud centered at (0, 3).
negative_samples = np.random.multivariate_normal(
    [0, 3], [[1, 0.5], [0.5, 1]], num_samples_per_class)

# Positive class: same covariance, centered at (3, 0).
positive_samples = np.random.multivariate_normal(
    [3, 0], [[1, 0.5], [0.5, 1]], num_samples_per_class)


# Stack both classes row-wise (negatives first) into one float32 feature matrix.
inputs = np.concatenate(
    [negative_samples, positive_samples], axis=0).astype(np.float32)


# Column vector of labels aligned with `inputs`: 0 for every negative row,
# then 1 for every positive row.
targets = np.repeat(
    np.array([[0.], [1.]], dtype=np.float32), num_samples_per_class, axis=0)


import matplotlib.pyplot as plt

# Scatter plot of feature 0 against feature 1, colored by class label.
plt.scatter(inputs[:, 0], inputs[:, 1], c=targets[:, 0])
plt.show()


input_dim = 2     # each input sample has 2 features
output_dim = 1    # a single output value per sample

# Weights: randomly initialized, shape (input_dim, output_dim)
W = tf.Variable(initial_value=tf.random.uniform(shape=(input_dim, output_dim)))

# Bias: initialized to zeros, shape (output_dim,)
b = tf.Variable(initial_value=tf.zeros(shape=(output_dim,)))


def model(inputs):
    """Return the affine prediction ``inputs @ W + b`` using the module-level W and b."""
    weighted_sum = tf.matmul(inputs, W)
    return weighted_sum + b


def square_loss(targets, predictions):
    """Return the mean of the squared differences between targets and predictions."""
    return tf.reduce_mean(tf.square(targets - predictions))


learning_rate = 0.1

def training_step(inputs, targets):
    """Apply one gradient-descent update to W and b and return the loss.

    The loss returned is the one computed before the update, on the
    given inputs and targets.
    """
    # Record the forward pass so the loss can be differentiated.
    with tf.GradientTape() as tape:
        loss = square_loss(targets, model(inputs))
    # Gradients come back in the same order as the variable list.
    gradients = tape.gradient(loss, [W, b])
    for variable, gradient in zip((W, b), gradients):
        # Step against the gradient, scaled by the learning rate.
        variable.assign_sub(gradient * learning_rate)
    return loss


# Run 40 update steps, each on the full dataset, printing the loss every step.
for step in range(40):
    loss = training_step(inputs, targets)
    print(f"Loss at step {step}: {loss:.4f}")

Loss at step 0: 5.6682
Loss at step 1: 0.8087
Loss at step 2: 0.2467
Loss at step 3: 0.1531
Loss at step 4: 0.1309
Loss at step 5: 0.1202
Loss at step 6: 0.1118
Loss at step 7: 0.1043
Loss at step 8: 0.0976
Loss at step 9: 0.0914
Loss at step 10: 0.0857
Loss at step 11: 0.0805
Loss at step 12: 0.0758
Loss at step 13: 0.0714
Loss at step 14: 0.0674
Loss at step 15: 0.0638
Loss at step 16: 0.0605
Loss at step 17: 0.0575
Loss at step 18: 0.0547
Loss at step 19: 0.0521
Loss at step 20: 0.0498
Loss at step 21: 0.0477
Loss at step 22: 0.0457
Loss at step 23: 0.0440
Loss at step 24: 0.0423
Loss at step 25: 0.0409
Loss at step 26: 0.0395
Loss at step 27: 0.0382
Loss at step 28: 0.0371
Loss at step 29: 0.0361
Loss at step 30: 0.0351
Loss at step 31: 0.0342
Loss at step 32: 0.0334
Loss at step 33: 0.0327
Loss at step 34: 0.0321
Loss at step 35: 0.0314
Loss at step 36: 0.0309
Loss at step 37: 0.0304
Loss at step 38: 0.0299
Loss at step 39: 0.0295


# Run 100 more update steps. W and b keep the values left by the previous
# loop; only the printed step counter restarts at 0.
for step in range(100):
    loss = training_step(inputs, targets)
    # Report every 10th step only.
    if step % 10 == 0:
        print(f"Loss at step {step}: {loss:.4f}")

Loss at step 0: 0.0291
Loss at step 10: 0.0266
Loss at step 20: 0.0256
Loss at step 30: 0.0252
Loss at step 40: 0.0250
Loss at step 50: 0.0250
Loss at step 60: 0.0249
Loss at step 70: 0.0249
Loss at step 80: 0.0249
Loss at step 90: 0.0249


# Run the trained linear model on every sample.
predictions = model(inputs)


# Color each sample by whether its prediction exceeds the 0.5 threshold.
plt.scatter(inputs[:, 0], inputs[:, 1], c=predictions[:, 0] > 0.5)
plt.show()


# Decision boundary: the model predicts W[0]*x + W[1]*y + b for a point (x, y),
# and the plots threshold that value at 0.5. Setting the prediction equal to 0.5
# and solving for y gives the line below.
x = np.linspace(-1, 4, 100)
y = - W[0] /  W[1] * x + (0.5 - b) / W[1]

# Draw the boundary as a red line over the samples colored by predicted class.
plt.plot(x, y, "-r")
plt.scatter(inputs[:, 0], inputs[:, 1], c=predictions[:, 0] > 0.5)

<matplotlib.collections.PathCollection at 0x230b19b7070>


from tensorflow import keras

class SimpleDense(keras.layers.Layer):
    """Minimal fully connected layer computing ``activation(inputs @ W + b)``.

    Args:
        units: Size of the last axis of the layer's output.
        activation: Optional callable applied to the affine output. When
            ``None``, the affine output is returned unchanged.
        **kwargs: Options for the ``keras.layers.Layer`` base class (for
            example ``name`` or ``dtype``), forwarded to its constructor.
    """

    def __init__(self, units, activation=None, **kwargs):
        # Forward base-class options so the layer can be configured like
        # the built-in Keras layers.
        super().__init__(**kwargs)
        self.units = units
        self.activation = activation

    def build(self, input_shape):
        """Create the weight matrix and bias for the given input shape."""
        input_dim = input_shape[-1]   # number of features per input sample
        self.W = self.add_weight(shape=(input_dim, self.units),
                                 initializer="random_normal")
        self.b = self.add_weight(shape=(self.units,),
                                 initializer="zeros")

    def call(self, inputs):
        """Return the affine transform of ``inputs``, passed through the activation if set."""
        y = tf.matmul(inputs, self.W) + self.b
        if self.activation is not None:
            y = self.activation(y)
        return y


# Instantiate the custom layer with 32 output units and a ReLU activation.
my_dense = SimpleDense(units=32, activation=tf.nn.relu)


# Dummy batch: 1000 samples with 784 features each.
input_tensor = tf.ones(shape=(1000, 784))


# Apply the layer to the batch; the result has one row per sample and
# `units` columns.
output_tensor = my_dense(input_tensor)

print(output_tensor.shape)

(1000, 32)


# NOTE: this rebinds the name `model`, replacing the `model(inputs)` function
# defined earlier in the file. `training_step` looks the name up at call time,
# so it would use this Keras model from here on.
model = keras.Sequential([keras.layers.Dense(1)])


# Configure training using string shortcuts for the optimizer, loss and metric.
model.compile(optimizer="rmsprop",
              loss="mean_squared_error",
              metrics=["accuracy"])


# Compile again, this time passing optimizer, loss and metric objects instead
# of strings; the metric is given explicitly as BinaryAccuracy.
model.compile(optimizer=keras.optimizers.RMSprop(),
              loss=keras.losses.MeanSquaredError(),
              metrics=[keras.metrics.BinaryAccuracy()])


# Train on the full dataset for 5 epochs in mini-batches of 128 samples.
# The returned object's `history` attribute is inspected in the next cell.
history = model.fit(
    inputs,
    targets,
    epochs=5,
    batch_size=128
)

Epoch 1/5
16/16 [==============================] - 0s 2ms/step - loss: 2.1943 - binary_accuracy: 0.4811
Epoch 2/5
16/16 [==============================] - 0s 3ms/step - loss: 1.9241 - binary_accuracy: 0.5061
Epoch 3/5
16/16 [==============================] - 0s 2ms/step - loss: 1.7317 - binary_accuracy: 0.4967
Epoch 4/5
16/16 [==============================] - 0s 2ms/step - loss: 1.5507 - binary_accuracy: 0.5146
Epoch 5/5
16/16 [==============================] - 0s 2ms/step - loss: 1.4457 - binary_accuracy: 0.5069


# Dict mapping each tracked quantity (loss, metric) to its list of per-epoch values.
history.history

{'loss': [2.093653917312622,
  1.8939359188079834,
  1.7320936918258667,
  1.5835086107254028,
  1.4453810453414917],
 'binary_accuracy': [0.49549999833106995,
  0.49549999833106995,
  0.4959999918937683,
  0.4959999918937683,
  0.4964999854564667]}


# Shuffle inputs and targets with one shared random permutation so each
# sample stays paired with its label.
indices_permutation = np.random.permutation(len(inputs))


shuffled_inputs = inputs[indices_permutation]
shuffled_targets = targets[indices_permutation]


# Hold out the first 30% of the shuffled samples for validation and keep the
# remainder for training.
# NOTE: the Keras model was already fit on the full `inputs` earlier in the
# file, so these validation samples are not unseen data for it.
num_validation_samples = int(0.3 * len(inputs))

val_inputs, training_inputs = np.split(
    shuffled_inputs, [num_validation_samples])
val_targets, training_targets = np.split(
    shuffled_targets, [num_validation_samples])


# Train on the training split for 5 epochs in mini-batches of 16 samples,
# also reporting loss and metric on the held-out validation split.
history = model.fit(
    training_inputs,
    training_targets,
    epochs=5,
    batch_size=16,
    validation_data=(val_inputs, val_targets)
)

Epoch 1/5
88/88 [==============================] - 1s 11ms/step - loss: 1.0726 - binary_accuracy: 0.4979 - val_loss: 0.8352 - val_binary_accuracy: 0.4950
Epoch 2/5
88/88 [==============================] - 0s 3ms/step - loss: 0.6193 - binary_accuracy: 0.5007 - val_loss: 0.4537 - val_binary_accuracy: 0.4950
Epoch 3/5
88/88 [==============================] - 0s 3ms/step - loss: 0.3114 - binary_accuracy: 0.5050 - val_loss: 0.1972 - val_binary_accuracy: 0.5267
Epoch 4/5
88/88 [==============================] - 0s 3ms/step - loss: 0.1178 - binary_accuracy: 0.8171 - val_loss: 0.0595 - val_binary_accuracy: 0.9867
Epoch 5/5
88/88 [==============================] - 0s 3ms/step - loss: 0.0371 - binary_accuracy: 0.9950 - val_loss: 0.0259 - val_binary_accuracy: 1.0000


# Per-epoch values again, now including the `val_`-prefixed validation entries.
history.history

{'loss': [1.072609543800354,
  0.6192675828933716,
  0.3113844394683838,
  0.11782326549291611,
  0.037062548100948334],
 'binary_accuracy': [0.49785715341567993,
  0.5007143020629883,
  0.5049999952316284,
  0.8171428442001343,
  0.9950000047683716],
 'val_loss': [0.8351580500602722,
  0.4537375867366791,
  0.19723956286907196,
  0.05950124189257622,
  0.025946015492081642],
 'val_binary_accuracy': [0.4950000047683716,
  0.4950000047683716,
  0.5266666412353516,
  0.9866666793823242,
  1.0]}


# Compute the loss and metric on the validation split, in batches of 128.
loss_and_metrics = model.evaluate(val_inputs, val_targets, batch_size=128)

5/5 [==============================] - 0s 0s/step - loss: 0.0259 - binary_accuracy: 1.0000


# Calling the model directly on the NumPy array returns the predictions as a tf.Tensor.
predictions = model(val_inputs)
print(predictions[:10])

tf.Tensor(
[[ 0.08220395]
 [-0.1380057 ]
 [ 0.13853893]
 [ 0.14018369]
 [ 1.109943  ]
 [ 0.6667064 ]
 [ 0.06574634]
 [ 0.5064674 ]
 [ 0.15613529]
 [ 0.88908464]], shape=(10, 1), dtype=float32)


# predict() runs the data through the model in batches of 128; the printed
# result is a plain array rather than a tf.Tensor.
predictions = model.predict(val_inputs, batch_size=128)
print(predictions[:10])

[[ 0.08220395]
 [-0.1380057 ]
 [ 0.13853893]
 [ 0.14018369]
 [ 1.109943  ]
 [ 0.6667064 ]
 [ 0.06574634]
 [ 0.5064674 ]
 [ 0.15613529]
 [ 0.88908464]]

3장 케라스와 텐서플로우¶

주요 내용¶

3.5 텐서플로우 기본 사용법¶

신경망 모델 훈련 핵심 1¶

텐서플로우 기본 API 활용법¶

상수 텐서¶

변수 텐서¶

텐서 연산¶

`GradientTape` API (다시 살펴 보기)¶

저수준 선형 분류 신경망 구현¶

데이터셋 생성¶

가중치 변수 텐서 생성¶

예측 모델(함수) 선언¶

손실 함수: 평균 제곱 오차(MSE)¶

훈련 단계¶

배치 훈련¶

예측¶

3.6 케라스의 핵심 API 이해¶

신경망 모델 훈련 핵심 2¶

층¶

`Layer` 클래스¶

`Dense` 클래스 직접 구현하기¶

층에서 모델로¶

가설 공간¶

망 구성방식¶

모델 컴파일¶

`fit()` 메서드 작동법¶

검증 세트 활용¶

모델 활용¶

3장 케라스와 텐서플로우¶

주요 내용¶

3.5 텐서플로우 기본 사용법¶

신경망 모델 훈련 핵심 1¶

텐서플로우 기본 API 활용법¶

상수 텐서¶

변수 텐서¶

텐서 연산¶

GradientTape API (다시 살펴 보기)¶

저수준 선형 분류 신경망 구현¶

데이터셋 생성¶

가중치 변수 텐서 생성¶

예측 모델(함수) 선언¶

손실 함수: 평균 제곱 오차(MSE)¶

훈련 단계¶

배치 훈련¶

예측¶

3.6 케라스의 핵심 API 이해¶

신경망 모델 훈련 핵심 2¶

층¶

Layer 클래스¶

Dense 클래스 직접 구현하기¶

층에서 모델로¶

가설 공간¶

망 구성방식¶

모델 컴파일¶

fit() 메서드 작동법¶

검증 세트 활용¶

모델 활용¶

`GradientTape` API (다시 살펴 보기)¶

`Layer` 클래스¶

`Dense` 클래스 직접 구현하기¶

`fit()` 메서드 작동법¶