| #!/usr/bin/python | |
| # The contents of this file are in the public domain. See LICENSE_FOR_EXAMPLE_PROGRAMS.txt | |
| # | |
| # This example shows how to use dlib's face recognition tool for clustering using chinese_whispers. | |
| # This is useful when you have a collection of photographs which you know are linked to | |
| # a particular person, but the person may be photographed with multiple other people. | |
| # In this example, we assume the largest cluster will contain photos of the common person in the | |
| # collection of photographs. Then, we save extracted images of the face in the largest cluster in | |
| # a 150x150 px format which is suitable for jittering and loading to perform metric learning (as shown | |
| # in the dnn_metric_learning_on_images_ex.cpp example. | |
| # https://github.com/davisking/dlib/blob/master/examples/dnn_metric_learning_on_images_ex.cpp | |
| # | |
| # COMPILING/INSTALLING THE DLIB PYTHON INTERFACE | |
| # You can install dlib using the command: | |
| # pip install dlib | |
| # | |
| # Alternatively, if you want to compile dlib yourself then go into the dlib | |
| # root folder and run: | |
| # python setup.py install | |
| # | |
| # Compiling dlib should work on any operating system so long as you have | |
| # CMake installed. On Ubuntu, this can be done easily by running the | |
| # command: | |
| # sudo apt-get install cmake | |
| # | |
| # Also note that this example requires Numpy which can be installed | |
| # via the command: | |
| # pip install numpy | |
| import sys | |
| import os | |
| import dlib | |
| import glob | |
| if len(sys.argv) != 5: | |
| print( | |
| "Call this program like this:\n" | |
| " ./face_clustering.py shape_predictor_5_face_landmarks.dat dlib_face_recognition_resnet_model_v1.dat ../examples/faces output_folder\n" | |
| "You can download a trained facial shape predictor and recognition model from:\n" | |
| " http://dlib.net/files/shape_predictor_5_face_landmarks.dat.bz2\n" | |
| " http://dlib.net/files/dlib_face_recognition_resnet_model_v1.dat.bz2") | |
| exit() | |
| predictor_path = sys.argv[1] | |
| face_rec_model_path = sys.argv[2] | |
| faces_folder_path = sys.argv[3] | |
| output_folder_path = sys.argv[4] | |
| # Load all the models we need: a detector to find the faces, a shape predictor | |
| # to find face landmarks so we can precisely localize the face, and finally the | |
| # face recognition model. | |
| detector = dlib.get_frontal_face_detector() | |
| sp = dlib.shape_predictor(predictor_path) | |
| facerec = dlib.face_recognition_model_v1(face_rec_model_path) | |
| descriptors = [] | |
| images = [] | |
| # Now find all the faces and compute 128D face descriptors for each face. | |
| for f in glob.glob(os.path.join(faces_folder_path, "*.jpg")): | |
| print("Processing file: {}".format(f)) | |
| img = dlib.load_rgb_image(f) | |
| # Ask the detector to find the bounding boxes of each face. The 1 in the | |
| # second argument indicates that we should upsample the image 1 time. This | |
| # will make everything bigger and allow us to detect more faces. | |
| dets = detector(img, 1) | |
| print("Number of faces detected: {}".format(len(dets))) | |
| # Now process each face we found. | |
| for k, d in enumerate(dets): | |
| # Get the landmarks/parts for the face in box d. | |
| shape = sp(img, d) | |
| # Compute the 128D vector that describes the face in img identified by | |
| # shape. | |
| face_descriptor = facerec.compute_face_descriptor(img, shape) | |
| descriptors.append(face_descriptor) | |
| images.append((img, shape)) | |
| # Now let's cluster the faces. | |
| labels = dlib.chinese_whispers_clustering(descriptors, 0.5) | |
| num_classes = len(set(labels)) | |
| print("Number of clusters: {}".format(num_classes)) | |
| # Find biggest class | |
| biggest_class = None | |
| biggest_class_length = 0 | |
| for i in range(0, num_classes): | |
| class_length = len([label for label in labels if label == i]) | |
| if class_length > biggest_class_length: | |
| biggest_class_length = class_length | |
| biggest_class = i | |
| print("Biggest cluster id number: {}".format(biggest_class)) | |
| print("Number of faces in biggest cluster: {}".format(biggest_class_length)) | |
| # Find the indices for the biggest class | |
| indices = [] | |
| for i, label in enumerate(labels): | |
| if label == biggest_class: | |
| indices.append(i) | |
| print("Indices of images in the biggest cluster: {}".format(str(indices))) | |
| # Ensure output directory exists | |
| if not os.path.isdir(output_folder_path): | |
| os.makedirs(output_folder_path) | |
| # Save the extracted faces | |
| print("Saving faces in largest cluster to output folder...") | |
| for i, index in enumerate(indices): | |
| img, shape = images[index] | |
| file_path = os.path.join(output_folder_path, "face_" + str(i)) | |
| # The size and padding arguments are optional with default size=150x150 and padding=0.25 | |
| dlib.save_face_chip(img, shape, file_path, size=150, padding=0.25) | |