YunYang1994
diff --git a/‎7-Utils/multi_gpu_train.py‎
Lines changed: 119 additions & 0 deletions b/‎7-Utils/multi_gpu_train.py‎
Lines changed: 119 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 2 additions & 3 deletions b/‎README.md‎
Lines changed: 2 additions & 3 deletions
@@ -0,0 +1,119 @@
+#! /usr/bin/env python
+# coding=utf-8
+#================================================================
+# Copyright (C) 2020 * Ltd. All rights reserved.
+#
+# Editor : VIM
+# File name : multi_gpu_train.py
+# Author : YunYang1994
+# Created date: 2020-02-02 22:14:30
+# Description :
+#
+#================================================================
+
+import tensorflow as tf
+from tqdm import tqdm
+from tensorflow.keras.preprocessing.image import ImageDataGenerator
+from tensorflow.keras import applications
+from tensorflow.keras.optimizers import SGD
+os.environ["CUDA_VISIBLE_DEVICES"] = "0,2,3"
+
+BATCH_SIZE = 384 # 3 GPU and 128 batch size per GPU
+EPOCHS = 30
+NUM_CLASS = 10
+EMB_SIZE = 512 # Embedding Size
+GPU_SIZE = 30 # (G) MemorySIZE per GPU
+IMG_SIZE = 112 # Input Image Size
+
+train_datagen = ImageDataGenerator(
+ rescale=1./255,
+ shear_range=0.2,
+ zoom_range=0.2,
+ horizontal_flip=True)
+
+train_generator = train_datagen.flow_from_directory(
+ '/home/yyang/mnist/train',
+ target_size=(IMG_SIZE, IMG_SIZE),
+ batch_size=BATCH_SIZE,
+ class_mode='categorical')
+
+tf.debugging.set_log_device_placement(True)
+gpus = tf.config.experimental.list_physical_devices('GPU')
+
+for gpu in gpus:
+ tf.config.experimental.set_virtual_device_configuration(
+ gpu, [tf.config.experimental.VirtualDeviceConfiguration(memory_limit=GPU_SIZE*1024)]
+ )
+logical_gpus = tf.config.experimental.list_logical_devices('GPU')
+print(len(gpus), "Physical GPU,", len(logical_gpus), "Logical GPUs")
+
+tf.debugging.set_log_device_placement(True)
+strategy = tf.distribute.MirroredStrategy()
+
+# Defining Model
+with strategy.scope():
+ model = applications.mobilenet_v2.MobileNetV2(include_top=False, weights=None,
+ input_shape=(IMG_SIZE,IMG_SIZE,3))
+ x = tf.keras.layers.Input(shape=(IMG_SIZE,IMG_SIZE,3))
+ y = model(x)
+ y = tf.keras.layers.AveragePooling2D()(y)
+ y = tf.keras.layers.Flatten()(y)
+ y = tf.keras.layers.Dense(EMB_SIZE, activation=None)(y)
+ y = tf.keras.layers.Dense(NUM_CLASS, activation='softmax')(y)
+ model = tf.keras.models.Model(inputs=x, outputs=y)
+
+ optimizer = tf.keras.optimizers.Adam(0.001)
+ checkpoint = tf.train.Checkpoint(optimizer=optimizer, model=model)
+
+# Defining Loss and Metrics
+with strategy.scope():
+ loss_object = tf.keras.losses.CategoricalCrossentropy(
+ reduction=tf.keras.losses.Reduction.NONE
+ )
+ def compute_loss(labels, predictions):
+ per_example_loss = loss_object(labels, predictions)
+ return tf.nn.compute_average_loss(per_example_loss, global_batch_size=BATCH_SIZE)
+
+ train_accuracy = tf.keras.metrics.CategoricalAccuracy(
+ name='train_accuracy'
+ )
+
+# Defining Training Step
+with strategy.scope():
+ def train_step(inputs):
+ images, labels = inputs
+
+ with tf.GradientTape() as tape:
+ predictions = model(images, training=True)
+ loss = compute_loss(labels, predictions)
+
+ gradients = tape.gradient(loss, model.trainable_variables)
+ optimizer.apply_gradients(zip(gradients, model.trainable_variables))
+ train_accuracy.update_state(labels, predictions)
+ return loss
+
+# Defining Training Loops
+with strategy.scope():
+ @tf.function
+ def distributed_train_step(dataset_inputs):
+ per_replica_losses = strategy.experimental_run_v2(train_step,
+ args=(dataset_inputs,))
+ return strategy.reduce(tf.distribute.ReduceOp.SUM, per_replica_losses,
+ axis=None)
+ for epoch in range(EPOCHS):
+ batchs_per_epoch = len(train_generator)
+ train_dataset = iter(train_generator)
+
+ with tqdm(total=batchs_per_epoch,
+ desc="Epoch %2d/%2d" %(epoch+1, EPOCHS)) as pbar:
+ for _ in range(batchs_per_epoch):
+ batch_loss = distributed_train_step(next(train_dataset))
+ batch_acc = train_accuracy.result()
+ pbar.set_postfix({'loss' : '%.4f' %batch_loss,
+ 'accuracy' : '%.6f' %batch_acc})
+ train_accuracy.reset_states()
+ pbar.update(1)
+
+model.save_weights("model.h5")
+
+
@@ -114,6 +114,5 @@ This tutorial was designed for easily diving into TensorFlow2.0. it includes bo
 - **DCGAN** ([notebook](https://nbviewer.jupyter.org/github/YunYang1994/tensorflow2.0-examples/blob/master/6-Generative_Adversarial_Networks/dcgan.ipynb)) ([code](6-Generative_Adversarial_Networks/dcgan.py))([paper](https://arxiv.org/pdf/1511.06434.pdf)). Deep Convolutional Generative Adversarial Network.
 - **Pix2Pix** ([notebook](https://nbviewer.jupyter.org/github/YunYang1994/tensorflow2.0-examples/blob/master/6-Generative_Adversarial_Networks/Pix2Pix.ipynb)) ([code](6-Generative_Adversarial_Networks/Pix2Pix.py))([paper](https://arxiv.org/pdf/1611.07004.pdf)). Image-to-Image Translation with Conditional Adversarial Networks.
 
-#### 7 - Reinforcement Learning
-
-- **DQN** ([notebook](6-Reinforcement_Learning/YOLOV2.ipynb)) ([code](6-Reinforcement_Learning/YOLOV2.py)). deep Q-network (DQN).
+#### 7 - Utils
+- **Multiple GPU Training** ([code](7-Utils/multi_gpu_train.py)). Use multiple GPUs to train your model.