# faceit_live3/faceit_live.py

import imageio
import numpy as np
import pandas as pd
from skimage.transform import resize
import warnings
import sys
import cv2
import time
import PIL.Image as Image
import PIL.ImageFilter
import io
from io import BytesIO
import pyautogui
import os
import glob
from argparse import Namespace
import argparse
import timeit
import torch
warnings.filterwarnings("ignore")

############## setup ####
# Static configuration: where source pictures and model weights live.
stream = True
media_path = './media/'
model_path = 'model/'

# Command line options (all optional).
parser = argparse.ArgumentParser()
parser.add_argument('--webcam_id', type=int, default=0)
parser.add_argument('--stream_id', type=int, default=1)
parser.add_argument('--gpu_id', type=int, default=0)
parser.add_argument('--system', type=str, default="win")
args = parser.parse_args()

webcam_id, gpu_id = args.webcam_id, args.gpu_id

# Size of the frames handled by the script and of the desktop the windows
# are positioned on.
webcam_width, webcam_height = 640, 480
screen_width, screen_height = pyautogui.size()
# Shape of the current source picture; overwritten by readimage().
img_shape = [256, 256, 0]

system = args.system
if system == "linux":
    # pyfakewebcam is only imported when the linux mode is requested.
    print("Linux version, importing FakeWebCam")
    import pyfakewebcam

stream_id = args.stream_id

# Make the first-order-model checkout importable.
first_order_path = 'first-order-model/'
sys.path.insert(0, first_order_path)
reset = True

# import methods from first-order-model
# (found through the first_order_path entry inserted into sys.path)
import demo
from demo import load_checkpoints, make_animation, tqdm

# prevent tqdm from outputting to console
# The name `tqdm` inside the demo module is rebound to a pass-through that
# returns its first positional argument and ignores everything else. The
# `tqdm` name imported into this file just above still refers to the original.
demo.tqdm = lambda *i, **kwargs: i[0]

# Report the CUDA environment and select the GPU requested with --gpu_id.
print("CUDA is available: ",torch.cuda.is_available())
if (torch.cuda.is_available()):
    # torch.cuda.device(...) only builds a context manager; without a `with`
    # block it selects nothing. set_device makes gpu_id the current device.
    torch.cuda.set_device(gpu_id)
    print("Device Name:",torch.cuda.get_device_name(gpu_id))
    print("Device Count:",torch.cuda.device_count())
    print("CUDA: ",torch.version.cuda)
    print("cuDNN",torch.backends.cudnn.version())
    print("Device",torch.cuda.current_device())


# Collect the source pictures offered by the B/N keys.
img_list = []
print("Scanning /media folder for images to use...")
# os.listdir returns entries in arbitrary order; sorting keeps the
# previous/next navigation order stable between runs.
for filename in sorted(os.listdir(media_path)):
    # Compare the extension case-insensitively so files such as "FACE.JPG"
    # are picked up as well.
    if filename.lower().endswith((".jpg", ".jpeg", ".png")):
        img_path = os.path.join(media_path, filename)
        img_list.append(img_path)
        print(img_path)

#print(img_list, len(img_list))


############## end setup ####

def _fit_to_stream(image, source_shape, out_width, out_height):
    """Letterbox ``image`` into a frame of exactly ``out_width`` x ``out_height``.

    The picture is scaled to the aspect ratio given by ``source_shape``
    (rows, columns, ...), as large as fits inside the output frame, and then
    padded with constant borders so the result always has the requested size.
    """
    aspect = source_shape[1] / source_shape[0]
    if aspect * out_height <= out_width:
        # Tall or moderately wide picture: use the full height, pad left/right.
        new_w, new_h = int(aspect * out_height), out_height
    else:
        # Picture wider than the output frame: use the full width, pad top/bottom.
        new_w, new_h = out_width, int(out_width / aspect)
    new_w, new_h = max(new_w, 1), max(new_h, 1)
    scaled = cv2.resize(image, (new_w, new_h))
    pad_x = out_width - new_w
    pad_y = out_height - new_h
    # Any odd pixel goes to the bottom/right border so the sizes add up exactly.
    top, left = pad_y // 2, pad_x // 2
    return cv2.copyMakeBorder(scaled, top, pad_y - top, left, pad_x - left, cv2.BORDER_CONSTANT)


def main():
    """Run the interactive capture -> animate -> display/stream loop.

    Loads the first source picture, opens the webcam, loads the face detector
    and the first-order-model networks, creates the three preview windows and
    then processes frames until Q is pressed or the webcam stops delivering
    frames. Keys (either case): C re-detects the face, B/N load the
    previous/next source picture, T toggles relative/absolute transformation,
    Q quits. The function ends by exiting the interpreter.
    """
    global source_image
    source_image =  readnextimage(0)

    # start streaming
    camera = None
    if system=="linux":
        camera = pyfakewebcam.FakeWebcam(f'/dev/video{stream_id}', webcam_width, webcam_height)
        camera.print_capabilities()
        print(f"Fake webcam created on /dev/video{stream_id}. Use Firefox and join a Google Meeting to test.")

    # capture webcam
    video_capture = cv2.VideoCapture(webcam_id)
    time.sleep(1)
    width = video_capture.get(3)  # float
    height = video_capture.get(4) # float
    print("webcam dimensions = {} x {}".format(width,height))

    # load models
    previous = None
    net = load_face_model()
    generator, kp_detector = demo.load_checkpoints(config_path=f'{first_order_path}config/vox-adv-256.yaml', checkpoint_path=f'{model_path}/vox-adv-cpk.pth.tar')

    # create windows
    cv2.namedWindow('Face', cv2.WINDOW_GUI_NORMAL) # extracted face
    cv2.moveWindow('Face', int(screen_width/2)-150, 100)
    cv2.resizeWindow('Face', 256,256)

    cv2.namedWindow('DeepFake', cv2.WINDOW_GUI_NORMAL) # face transformation
    cv2.moveWindow('DeepFake', int(screen_width/2)+150, 100)
    cv2.resizeWindow('DeepFake', int(img_shape[1] / img_shape[0] * 256), 256)

    cv2.namedWindow('Stream', cv2.WINDOW_GUI_NORMAL) # rendered to fake webcam
    cv2.moveWindow('Stream', int(screen_width/2)-int(webcam_width/2), 400)
    cv2.resizeWindow('Stream', webcam_width,webcam_height)

    print("Press C to center Webcam, Press B/N for previous/next image in media directory, T to alter between relative and absolute transformation, Q to quit")
    x1,y1,x2,y2 = [0,0,0,0]
    relative = True
    # Assigning to `reset` below makes it local to main(), so it is
    # initialised here explicitly instead of relying on the module-level value.
    reset = True
    try:
        while True:
            ret, frame = video_capture.read()
            if not ret or frame is None:
                # No frame (camera missing, unplugged or busy): stop cleanly
                # instead of failing inside cv2.resize.
                print("Could not read a frame from the webcam, stopping")
                break
            frame = cv2.resize(frame, (webcam_width, webcam_height))
            frame = cv2.flip(frame,1)

            if previous is None or reset:
                # (Re)detect the face and remember this crop as the reference
                # frame passed to the animation as `base`.
                x1,y1,x2,y2 = find_face_cut(net,frame)
                previous = cut_face_window(x1,y1,x2,y2,frame)
                reset = False

            curr_face = cut_face_window(x1,y1,x2,y2,frame)
            deep_fake = process_image(source_image,previous,curr_face,net, generator, kp_detector, relative)
            deep_fake = cv2.cvtColor(deep_fake, cv2.COLOR_RGB2BGR)

            cv2.imshow('Face', curr_face)
            cv2.imshow('DeepFake', deep_fake)

            # Restore the source picture's aspect ratio and pad to the exact
            # stream size; the fake webcam was created for
            # webcam_width x webcam_height frames.
            stream_v = _fit_to_stream(deep_fake, img_shape, webcam_width, webcam_height)
            cv2.imshow('Stream',stream_v)

            stream_v = cv2.flip(stream_v,1)
            stream_v = cv2.cvtColor(stream_v, cv2.COLOR_BGR2RGB)
            stream_v = (stream_v*255).astype(np.uint8)

            # stream to fakewebcam
            if system=="linux":
                camera.schedule_frame(stream_v)

            # Mask once so every key is compared the same way; waitKey returns
            # -1 when nothing was pressed, which masks to 255 and matches no key.
            key = chr(cv2.waitKey(1) & 0xFF).lower()
            if key == 'q':
                print("Quiting")
                break
            elif key == 'c':
                # center
                print("Centering the image")
                reset = True
            elif key == 'b':
                # previous image
                print("Loading previous image")
                source_image = readpreviousimage()
                reset = True
            elif key == 'n':
                # next image
                print("Loading next image")
                source_image = readnextimage()
                reset = True
            elif key == 't':
                # toggle relative / absolute transformation
                relative = not relative
                print("Changing transform mode")
    finally:
        # Free the camera and close the windows on every exit path.
        video_capture.release()
        cv2.destroyAllWindows()

    sys.exit()


# transform face with first-order-model
def process_image(source_image,base,current,net, generator,kp_detector,relative):
    """Animate ``source_image`` with the two driving frames ``base`` and ``current``.

    ``make_animation`` is called with ``[base, current]`` as driving frames,
    ``adapt_movement_scale=False`` and ``cpu=False``; the element at index 1
    of its result is returned (presumably the prediction for ``current`` --
    confirm against first-order-model's demo.make_animation).
    ``net`` is accepted but not used here.
    """
    driving_frames = [base, current]
    animated = make_animation(
        source_image,
        driving_frames,
        generator,
        kp_detector,
        relative=relative,
        adapt_movement_scale=False,
        cpu=False,
    )
    return animated[1]

def load_face_model():
    """Load the Caffe face-detection network stored under ``model_path``.

    Returns the network created by ``cv2.dnn.readNetFromCaffe`` from
    ``deploy.prototxt.txt`` and ``res10_300x300_ssd_iter_140000.caffemodel``.
    """
    # os.path.join builds the same locations whether or not model_path ends
    # with a separator; the former string concatenation ("model//...",
    # "model/./...") only resolved because it does.
    modelFile = os.path.join(model_path, "res10_300x300_ssd_iter_140000.caffemodel")
    configFile = os.path.join(model_path, "deploy.prototxt.txt")
    net = cv2.dnn.readNetFromCaffe(configFile, modelFile)
    return net

def cut_face_window(x1,y1,x2,y2,frame):
    """Crop ``frame`` to rows ``y1:y2`` / columns ``x1:x2`` and rescale to 256x256.

    Only the first three channels of the rescaled crop are returned.
    """
    window = frame[y1:y2, x1:x2]
    scaled = resize(window, (256, 256))
    return scaled[..., :3]

# find the face in webcam stream and center a 256x256 window
def find_face_cut(net,face,previous=False):
    """Return a crop window ``(x1, y1, x2, y2)`` around the strongest face.

    ``face`` is run through the detector ``net``. The detection with the
    highest confidence is used if that confidence exceeds 0.8. Its box is
    grown to roughly 256x256 pixels: the horizontal margin is split evenly,
    the vertical margin goes 2/3 above and 1/3 below the box. The window is
    clamped to the frame. When no detection qualifies, or the clamped window
    is empty, a 256x256 window in the middle of the frame is returned.

    ``previous`` is accepted for compatibility and not used.
    """
    frameHeight, frameWidth = face.shape[:2]
    blob = cv2.dnn.blobFromImage(face, 1.0, (300, 300), [104, 117, 123], False, False)
    net.setInput(blob)
    detections = net.forward()

    # Fallback: a window of up to 256x256 centred in the frame. The former
    # constants (112,192,368,448) had the x and y offsets swapped for a
    # 640x480 frame, so the window was not centred.
    mid_x1 = max((frameWidth - 256) // 2, 0)
    mid_y1 = max((frameHeight - 256) // 2, 0)
    centre_cut = (mid_x1, mid_y1, min(mid_x1 + 256, frameWidth), min(mid_y1 + 256, frameHeight))

    # Use the most confident detection; the previous loop kept whichever
    # qualifying detection came last, not the strongest one.
    confidences = detections[0, 0, :, 2]
    best = int(confidences.argmax()) if confidences.size else -1
    if best < 0 or confidences[best] <= 0.8:
        print("No face detected in video")
        return centre_cut

    x1 = int(detections[0, 0, best, 3] * frameWidth)
    y1 = int(detections[0, 0, best, 4] * frameHeight)
    x2 = int(detections[0, 0, best, 5] * frameWidth)
    y2 = int(detections[0, 0, best, 6] * frameHeight)

    # Pixels to add so the window becomes about 256 wide / high.
    face_margin_w = int(256 - (abs(x1-x2) -.5))
    face_margin_h = int(256 - (abs(y1-y2) -.5))

    # Clamp every edge so the returned (and logged) coordinates describe the
    # region that is really cropped.
    cut_x1 = max(x1 - int(face_margin_w/2), 0)
    cut_y1 = max(y1 - int(2*face_margin_h/3), 0)
    cut_x2 = min(x2 + int(face_margin_w/2), frameWidth)
    cut_y2 = min(y2 + int(face_margin_h/3), frameHeight)

    print(f'Found face at: ({x1},{y1}) ({x2},{y2}) width: {abs(x2-x1)} height: {abs(y2-y1)}')
    if cut_x2 <= cut_x1 or cut_y2 <= cut_y1:
        # A box entirely outside the frame would give an empty crop.
        print("Face window lies outside the frame, using the middle of the image")
        return centre_cut
    print(f'Cutting at: ({cut_x1},{cut_y1}) ({cut_x2},{cut_y2}) width: {abs(cut_x2-cut_x1)} height: {abs(cut_y2-cut_y1)}')

    return cut_x1,cut_y1,cut_x2,cut_y2

def readimage():
    """Load ``img_list[pos]`` and return it as a 256x256 three-channel image.

    Also stores the loaded picture's shape in the global ``img_shape`` and
    resizes the 'DeepFake' window to the picture's aspect ratio.

    Raises:
        IndexError: if no images were found in the media folder.
    """
    global img_list,img_shape
    if not img_list:
        raise IndexError(f"no .jpg/.jpeg/.png images found in {media_path!r}")
    img = imageio.imread(img_list[pos])
    if img.ndim == 2:
        # Grayscale file: replicate the single channel, otherwise the
        # [..., :3] slice below would cut image columns instead of channels.
        img = np.stack((img,) * 3, axis=-1)
    img_shape = img.shape
    try:
        cv2.resizeWindow('DeepFake', int(img_shape[1] / img_shape[0] * 256), 256)
    except cv2.error:
        # The first picture is loaded before main() creates the window;
        # NOTE(review): some OpenCV builds appear to raise for an unknown
        # window name -- main() sizes the window itself after creating it.
        pass
    img = resize(img, (256, 256))[..., :3]
    return img

def readpreviousimage():
    """Step back to the previous image, wrapping from the first to the last.

    Updates the global ``pos`` and returns the image loaded by ``readimage()``.
    """
    global pos
    count = len(img_list)
    if count:
        # Modulo keeps pos inside 0..count-1. The old branch jumped from the
        # last image to index 0 and let pos run into ever more negative
        # values when stepping back from the first image.
        pos = (pos - 1) % count
    return readimage()

def readnextimage(position=-1):
    """Select an image and return it via ``readimage()``.

    With the default ``position`` of -1 the global ``pos`` advances by one,
    going back to 0 once the end of ``img_list`` is reached; any other value
    is stored in ``pos`` directly.
    """
    global pos
    if position == -1:
        last_index = len(img_list) - 1
        pos = pos + 1 if pos < last_index else 0
    else:
        pos = position
    return readimage()

# Script entry point: start the capture/animation loop when the file is run.
main()
First Commit 4 years ago			`import imageio`
			`import numpy as np`
			`import pandas as pd`
			`from skimage.transform import resize`
			`import warnings`
			`import sys`
			`import cv2`
			`import time`
			`import PIL.Image as Image`
			`import PIL.ImageFilter`
			`import io`
			`from io import BytesIO`
			`import pyautogui`
			`import os`
			`import glob`
Correct readme and read command line parameters 4 years ago			`from argparse import Namespace`
			`import argparse`
small corrections to readme 4 years ago			`import timeit`
added instructions on how to use Windows + OBS 4 years ago			`import torch`
First Commit 4 years ago			`warnings.filterwarnings("ignore")`

			`############## setup ####`
			`stream = True`
			`media_path = './media/'`
			`model_path = 'model/'`
Correct readme and read command line parameters 4 years ago
			`parser = argparse.ArgumentParser()`
added instructions on how to use Windows + OBS 4 years ago			`parser.add_argument('--webcam_id', type = int, default = 0)`
Correct readme and read command line parameters 4 years ago			`parser.add_argument('--stream_id', type = int, default = 1)`
added instructions on how to use Windows + OBS 4 years ago			`parser.add_argument('--gpu_id', type = int, default = 0)`
			`parser.add_argument('--system', type = str, default = "win")`
Correct readme and read command line parameters 4 years ago
added instructions on how to use Windows + OBS 4 years ago			`args = parser.parse_args()`
Correct readme and read command line parameters 4 years ago			`webcam_id = args.webcam_id`
added instructions on how to use Windows + OBS 4 years ago			`gpu_id = args.gpu_id`

First Commit 4 years ago			`webcam_height = 480`
			`webcam_width = 640`
			`screen_width, screen_height = pyautogui.size()`
Automatically adjust window size and borders 4 years ago			`img_shape = [256, 256, 0]`
First Commit 4 years ago
added instructions on how to use Windows + OBS 4 years ago			`system = args.system`
			`if system=="linux":`
more details on the readme file 4 years ago			`print("Linux version, importing FakeWebCam")`
added instructions on how to use Windows + OBS 4 years ago			`import pyfakewebcam`


Correct readme and read command line parameters 4 years ago			`stream_id = args.stream_id`
First Commit 4 years ago			`first_order_path = 'first-order-model/'`
			`sys.path.insert(0,first_order_path)`
			`reset = True`

			`# import methods from first-order-model`
			`import demo`
			`from demo import load_checkpoints, make_animation, tqdm`

			`# prevent tqdm from outputting to console`
			`demo.tqdm = lambda i, *kwargs: i[0]`

added instructions on how to use Windows + OBS 4 years ago			`print("CUDA is available: ",torch.cuda.is_available())`
			`if (torch.cuda.is_available()):`
			`torch.cuda.device("cuda:" + str(gpu_id))`
			`print("Device Name:",torch.cuda.get_device_name(gpu_id))`
			`print("Device Count:",torch.cuda.device_count())`
			`print("CUDA: ",torch.version.cuda)`
			`print("cuDNN",torch.backends.cudnn.version())`
			`print("Device",torch.cuda.current_device())`



First Commit 4 years ago			`img_list = []`
added instructions on how to use Windows + OBS 4 years ago			`print("Scanning /media folder for images to use...")`
First Commit 4 years ago			`for filename in os.listdir(media_path):`
			`if filename.endswith(".jpg") or filename.endswith(".jpeg") or filename.endswith(".png"):`
			`img_list.append(os.path.join(media_path, filename))`
			`print(os.path.join(media_path, filename))`

added instructions on how to use Windows + OBS 4 years ago			`#print(img_list, len(img_list))`
First Commit 4 years ago




			`############## end setup ####`

			`def main():`
			`global source_image`
			`source_image = readnextimage(0)`

			`# start streaming`
added instructions on how to use Windows + OBS 4 years ago			`if system=="linux":`
			`camera = pyfakewebcam.FakeWebcam(f'/dev/video{stream_id}', webcam_width, webcam_height)`
			`camera.print_capabilities()`
			`print(f"Fake webcam created on /dev/video{stream_id}. Use Firefox and join a Google Meeting to test.")`
First Commit 4 years ago
			`# capture webcam`
			`video_capture = cv2.VideoCapture(webcam_id)`
			`time.sleep(1)`
			`width = video_capture.get(3) # float`
			`height = video_capture.get(4) # float`
			`print("webcam dimensions = {} x {}".format(width,height))`

			`# load models`
			`previous = None`
			`net = load_face_model()`
			`generator, kp_detector = demo.load_checkpoints(config_path=f'{first_order_path}config/vox-adv-256.yaml', checkpoint_path=f'{model_path}/vox-adv-cpk.pth.tar')`


			`# create windows`
			`cv2.namedWindow('Face', cv2.WINDOW_GUI_NORMAL) # extracted face`
			`cv2.moveWindow('Face', int(screen_width/2)-150, 100)`
			`cv2.resizeWindow('Face', 256,256)`

			`cv2.namedWindow('DeepFake', cv2.WINDOW_GUI_NORMAL) # face transformation`
			`cv2.moveWindow('DeepFake', int(screen_width/2)+150, 100)`
Also resize first image 4 years ago			`cv2.resizeWindow('DeepFake', int(img_shape[1] / img_shape[0] * 256), 256)`
First Commit 4 years ago

			`cv2.namedWindow('Stream', cv2.WINDOW_GUI_NORMAL) # rendered to fake webcam`
			`cv2.moveWindow('Stream', int(screen_width/2)-int(webcam_width/2), 400)`
Automatically adjust window size and borders 4 years ago			`cv2.resizeWindow('Stream', webcam_width,webcam_height)`
First Commit 4 years ago

Updated console message 4 years ago			`print("Press C to center Webcam, Press B/N for previous/next image in media directory, T to alter between relative and absolute transformation, Q to quit")`
New keypress option 'T' to toggle between transformation modes 4 years ago			`x1,y1,x2,y2 = [0,0,0,0]`
			`relative = True`
First Commit 4 years ago			`while True:`
			`ret, frame = video_capture.read()`
			`frame = cv2.resize(frame, (640, 480))`
			`frame = cv2.flip(frame,1)`

			`if (previous is None or reset is True):`
			`x1,y1,x2,y2 = find_face_cut(net,frame)`
New keypress option 'T' to toggle between transformation modes 4 years ago			`previous = cut_face_window(x1,y1,x2,y2,frame)`
First Commit 4 years ago			`reset = False`
New keypress option 'T' to toggle between transformation modes 4 years ago			`#cv2.imshow('Previous',previous)`

First Commit 4 years ago
New keypress option 'T' to toggle between transformation modes 4 years ago			`curr_face = cut_face_window(x1,y1,x2,y2,frame)`
			`#cv2.imshow('Curr Face',curr_face)`
			`#cv2.imshow('Source Image',source_image)`
			`deep_fake = process_image(source_image,previous,curr_face,net, generator, kp_detector, relative)`
First Commit 4 years ago			`deep_fake = cv2.cvtColor(deep_fake, cv2.COLOR_RGB2BGR)`

			`#cv2.imshow('Webcam', frame) - get face`
New keypress option 'T' to toggle between transformation modes 4 years ago			`cv2.imshow('Face', curr_face)`
First Commit 4 years ago			`cv2.imshow('DeepFake', deep_fake)`


Automatically adjust window size and borders 4 years ago			`rgb = cv2.resize(deep_fake,(int(img_shape[1] / img_shape[0] * 480),480))`
First Commit 4 years ago			`# pad image`
Automatically adjust window size and borders 4 years ago			`x_border = int((640-(img_shape[1] / img_shape[0] * 480))/2)`
			`y_border = int((480-(img_shape[0] / img_shape[1] * 640))/2)`
			`stream_v = cv2.copyMakeBorder(rgb, y_border if y_border >=0 else 0, y_border if y_border >=0 else 0, x_border if x_border >=0 else 0, x_border if x_border >=0 else 0, cv2.BORDER_CONSTANT)`
First Commit 4 years ago			`cv2.imshow('Stream',stream_v)`

			`#time.sleep(1/30.0)`
			`stream_v = cv2.flip(stream_v,1)`
			`stream_v = cv2.cvtColor(stream_v, cv2.COLOR_BGR2RGB)`
			`stream_v = (stream_v*255).astype(np.uint8)`

			`# stream to fakewebcam`
added instructions on how to use Windows + OBS 4 years ago			`if system=="linux":`
more details on the readme file 4 years ago			`#print("output to fakecam")`
added instructions on how to use Windows + OBS 4 years ago			`camera.schedule_frame(stream_v)`
First Commit 4 years ago
			`k = cv2.waitKey(1)`
			`# Hit 'q' on the keyboard to quit!`
			`if k & 0xFF == ord('q'):`
Giving more keypress feedback on the console. 4 years ago			`print("Quiting")`
First Commit 4 years ago			`video_capture.release()`
			`break`
			`elif k==ord('c'):`
			`# center`
Updated console message 4 years ago			`print("Centering the image")`
First Commit 4 years ago			`reset = True`
Key B for previous image 4 years ago			`elif k==ord('b'):`
Updated console message 4 years ago			`# previous image`
Key B for previous image 4 years ago			`print("Loading previous image")`
			`source_image = readpreviousimage()`
			`reset = True`
First Commit 4 years ago			`elif k==ord('n'):`
Updated console message 4 years ago			`# next image`
Key B for previous image 4 years ago			`print("Loading next image")`
First Commit 4 years ago			`source_image = readnextimage()`
			`reset = True`
new t option 4 years ago			`elif k==ord('t'):`
Giving more keypress feedback on the console. 4 years ago			`# rotate`
New keypress option 'T' to toggle between transformation modes 4 years ago			`relative = not relative`
Giving more keypress feedback on the console. 4 years ago			`print("Changing transform mode")`

First Commit 4 years ago
			`cv2.destroyAllWindows()`
			`exit()`


			`# transform face with first-order-model`
New keypress option 'T' to toggle between transformation modes 4 years ago			`def process_image(source_image,base,current,net, generator,kp_detector,relative):`
added instructions on how to use Windows + OBS 4 years ago			`predictions = make_animation(source_image, [base,current], generator, kp_detector, relative=relative, adapt_movement_scale=False, cpu=False)`
			`#print("Device",torch.cuda.current_device())`
			`#print("Device Name:",torch.cuda.get_device_name(gpu_id))`
New keypress option 'T' to toggle between transformation modes 4 years ago			`# predictions = [1]# predictions[..., ::-1]`
			`# predictions = (np.clip(predictions, 0, 1) * 255).astype(np.uint8)`
First Commit 4 years ago			`return predictions[1]`

			`def load_face_model():`
			`modelFile = f"{model_path}/res10_300x300_ssd_iter_140000.caffemodel"`
			`configFile = f"{model_path}./deploy.prototxt.txt"`
			`net = cv2.dnn.readNetFromCaffe(configFile, modelFile)`
			`return net`

New keypress option 'T' to toggle between transformation modes 4 years ago			`def cut_face_window(x1,y1,x2,y2,frame):`
First Commit 4 years ago			`cut_x1 = x1`
			`cut_y1 = y1`
			`cut_x2 = x2`
			`cut_y2 = y2`
New keypress option 'T' to toggle between transformation modes 4 years ago			`frame = frame[cut_y1:cut_y2,cut_x1:cut_x2]`
			`face = resize(frame, (256, 256))[..., :3]`
First Commit 4 years ago
			`return face`

			`# find the face in webcam stream and center a 256x256 window`
			`def find_face_cut(net,face,previous=False):`
			`blob = cv2.dnn.blobFromImage(face, 1.0, (300, 300), [104, 117, 123], False, False)`
			`frameWidth = 640`
			`frameHeight = 480`
			`net.setInput(blob)`
			`detections = net.forward()`
			`bboxes = []`
when no face is found, use middle of webcam image. 4 years ago			`face_found = False`
First Commit 4 years ago			`for i in range(detections.shape[2]):`
			`confidence = detections[0, 0, i, 2]`
			`if confidence > 0.8:`
when no face is found, use middle of webcam image. 4 years ago			`face_found = True`
First Commit 4 years ago			`x1 = int(detections[0, 0, i, 3] * frameWidth)`
			`y1 = int(detections[0, 0, i, 4] * frameHeight)`
			`x2 = int(detections[0, 0, i, 5] * frameWidth)`
			`y2 = int(detections[0, 0, i, 6] * frameHeight)`

			`face_margin_w = int(256 - (abs(x1-x2) -.5))`
			`face_margin_h = int(256 - (abs(y1-y2) -.5))`

			`cut_x1 = (x1 - int(face_margin_w/2))`
			`if cut_x1<0: cut_x1=0`
			`cut_y1 = y1 - int(2*face_margin_h/3)`
			`if cut_y1<0: cut_y1=0`
			`cut_x2 = x2 + int(face_margin_w/2)`
			`cut_y2 = y2 + int(face_margin_h/3)`

when no face is found, use middle of webcam image. 4 years ago			`if not face_found:`
			`print("No face detected in video")`
			`# let's just use the middle section of the image`
			`cut_x1,cut_y1,cut_x2,cut_y2 = 112,192,368,448`
First Commit 4 years ago			`else:`
			`print(f'Found face at: ({x1,y1}) ({x2},{y2} width:{abs(x2-x1)} height: {abs(y2-y1)})')`
			`print(f'Cutting at: ({cut_x1,cut_y1}) ({cut_x2},{cut_y2} width:{abs(cut_x2-cut_x1)} height: {abs(cut_y2-cut_y1)})')`


			`return cut_x1,cut_y1,cut_x2,cut_y2`

Key B for previous image 4 years ago			`def readimage():`
			`global img_list,img_shape`
			`img = imageio.imread(img_list[pos])`
			`img_shape = img.shape`
			`cv2.resizeWindow('DeepFake', int(img_shape[1] / img_shape[0] * 256), 256)`
			`img = resize(img, (256, 256))[..., :3]`
			`return img`

			`def readpreviousimage():`
			`global pos`
			`if pos<len(img_list)-1:`
			`pos=pos-1`
			`else:`
			`pos=0`
			`return readimage()`

First Commit 4 years ago			`def readnextimage(position=-1):`
Key B for previous image 4 years ago			`global pos`
First Commit 4 years ago			`if (position != -1):`
			`pos = position`
			`else:`
			`if pos<len(img_list)-1:`
			`pos=pos+1`
			`else:`
			`pos=0`
Key B for previous image 4 years ago			`return readimage()`
First Commit 4 years ago
			`main()`