Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
761 changes: 614 additions & 147 deletions README.md

Large diffs are not rendered by default.

65 changes: 65 additions & 0 deletions talkingface/data/dataprocess/PHADTF_process.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,65 @@
import cv2
import os, sys
import glob
import dlib
import numpy as np
import time
import pdb
# Module-level dlib models shared by every call in this script:
# a HOG-based frontal face detector and a 68-point facial landmark predictor.
# NOTE(review): the predictor weights are loaded from a relative path into the
# sibling Deep3DFaceReconstruction checkout — the script must be run from a
# directory where that path resolves; confirm against the repo layout.
detector = dlib.get_frontal_face_detector()
predictor = dlib.shape_predictor('../Deep3DFaceReconstruction/shape_predictor_68_face_landmarks.dat')

def shape_to_np(shape, dtype="int"):
    """Convert a dlib full_object_detection into an (num_parts, 2) numpy array.

    Parameters:
        shape -- dlib landmark result exposing ``num_parts`` and ``part(i)``
        dtype -- numpy dtype of the returned coordinate array

    Returns:
        numpy array where row i holds the (x, y) of landmark i.
    """
    # Preallocate the output, then copy each landmark's coordinates in.
    coords = np.empty((shape.num_parts, 2), dtype=dtype)
    for idx in range(shape.num_parts):
        pt = shape.part(idx)
        coords[idx, 0] = pt.x
        coords[idx, 1] = pt.y
    return coords

def detect_image(imagename, savepath=""):
    """Detect 68 facial landmarks in one image and optionally save 5 key points.

    Draws every detected landmark onto the in-memory image, then derives five
    key points from the landmarks — left/right eye centers (mean of points
    36-41 / 42-47), nose tip (33), and mouth corners (48, 54) — and writes
    them to ``savepath`` as one "x y" pair per line.

    Parameters:
        imagename (str) -- path of the image to read
        savepath  (str) -- output .txt path; "" disables writing

    Returns:
        None. Silently skips images that cannot be read or contain no face.
    """
    image = cv2.imread(imagename)
    if image is None:
        # BUG-FIX: cv2.imread returns None for missing/corrupt files; the
        # original then crashed inside cvtColor. Skip instead.
        print("detect_image: could not read %s" % imagename)
        return
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    rects = detector(gray, 1)
    if len(rects) == 0:
        # BUG-FIX: the original referenced `shape` after the loop, raising
        # NameError whenever no face was detected. Skip gracefully.
        print("detect_image: no face detected in %s" % imagename)
        return
    for (i, rect) in enumerate(rects):
        shape = predictor(gray, rect)
        shape = shape_to_np(shape)
        for (x, y) in shape:
            cv2.circle(image, (x, y), 1, (0, 0, 255), -1)
    # NOTE: when several faces are present, only the LAST detected face's
    # landmarks are used below (preserved from the original behavior).
    eyel = np.round(np.mean(shape[36:42, :], axis=0)).astype("int")
    eyer = np.round(np.mean(shape[42:48, :], axis=0)).astype("int")
    nose = shape[33]
    mouthl = shape[48]
    mouthr = shape[54]
    if savepath != "":
        message = '%d %d\n%d %d\n%d %d\n%d %d\n%d %d\n' % (eyel[0], eyel[1],
                  eyer[0], eyer[1], nose[0], nose[1],
                  mouthl[0], mouthl[1], mouthr[0], mouthr[1])
        with open(savepath, 'w') as s_file:
            s_file.write(message)
    return
def detect_dir(folder):
    """Run landmark detection on every .jpg/.png in *folder*.

    For each image, the five key points are written next to it with the same
    basename and a .txt extension.
    """
    images = glob.glob(folder + "/*.jpg") + glob.glob(folder + "/*.png")
    for image_path in sorted(images):
        print(image_path)
        txt_path = image_path[:-4] + '.txt'
        detect_image(imagename=image_path, savepath=txt_path)

# Script entry: dump up to 400 frames of the video given as argv[1] into a
# directory named after the video (extension stripped), then run landmark
# detection on every dumped frame.
t1 = time.time()
mp4 = sys.argv[1]
videoname = mp4
cap = cv2.VideoCapture(videoname)
length = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
success, image = cap.read()
postfix = ".png"
outdir = mp4[:-4]
if not os.path.exists(outdir):
    os.makedirs(outdir)
count = 0
# BUG-FIX: the original loop ignored `success`, so a video shorter than 400
# frames fed image=None to cv2.imwrite and crashed (or rewrote stale frames).
while success and count < 400:
    cv2.imwrite("%s/frame%d%s" % (outdir, count, postfix), image)
    success, image = cap.read()
    count += 1
# BUG-FIX: release the capture handle instead of leaking it.
cap.release()
detect_dir(outdir)
t2 = time.time()
# Report the timing that was measured but never printed in the original.
print("processed %d/%d frames of %s in %.2fs" % (count, length, videoname, t2 - t1))
171 changes: 171 additions & 0 deletions talkingface/data/dataset/PHADTF_GAN_dataset.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,171 @@
import os.path
from PIL import Image
import numpy as np
import torch
from .dataset import *

class PHADTD_GAN_dataset(Dataset):
    """Thin wrapper selecting the PHADTF GAN dataset variant by phase.

    Wraps SingleMultiDataset for training and AlignedFeatureMultiDataset for
    testing, delegating item access and length to the wrapped dataset.
    """

    def __init__(self, isTrain=True, opt=None):
        """Build the wrapped dataset.

        Parameters:
            isTrain (bool) -- True selects SingleMultiDataset,
                False selects AlignedFeatureMultiDataset
            opt -- experiment options forwarded to the wrapped dataset.
                BUG-FIX: both wrapped classes require an ``opt`` argument, yet
                the original constructed them with no arguments, which always
                raised TypeError. The new parameter defaults to None so
                existing call sites keep working syntactically.
        """
        if isTrain:
            self.set = SingleMultiDataset(opt)
        else:
            self.set = AlignedFeatureMultiDataset(opt)

    def __getitem__(self, index):
        # Delegate straight to the wrapped dataset.
        return self.set[index]

    def __len__(self):
        # Added so DataLoader can size this wrapper like the wrapped set.
        return len(self.set)

class SingleMultiDataset(Dataset):
    """Dataset that loads a temporal window of Nw consecutive frames per item.

    It can be used for generating CycleGAN results only for one side with the
    model option '-model test'. Image paths come from a pre-built list file
    'datasets/list/<phase>Single/<dataroot>.txt' when it exists, otherwise by
    scanning opt.dataroot directly.
    """

    def __init__(self, opt):
        """Initialize this dataset class.

        Parameters:
            opt (Option class) -- stores all the experiment flags; needs to be
                a subclass of BaseOptions
        """
        BaseDataset.__init__(self, opt)
        imglistA = 'datasets/list/%s/%s.txt' % (opt.phase + 'Single', opt.dataroot)
        if not os.path.exists(imglistA):
            self.A_paths = sorted(make_dataset(opt.dataroot, opt.max_dataset_size))
        else:
            # BUG-FIX: close the list file via a context manager (the original
            # leaked the open file handle).
            with open(imglistA, 'r') as f:
                self.A_paths = f.read().splitlines()
        self.input_nc = self.opt.output_nc if self.opt.direction == 'BtoA' else self.opt.input_nc
        self.Nw = self.opt.Nw  # number of frames stacked per sample

    def __getitem__(self, index):
        """Return a data point and its metadata information.

        Parameters:
            index -- a random integer for data indexing

        Returns a dictionary that contains:
            A (tensor) -- Nw frames stacked channel-wise; the frame at
                ``index`` occupies the last input_nc channels, preceded by the
                Nw-1 earlier frames of the same sequence
            A_paths (str) -- path of the current frame
            resnet_input (tensor, optional) -- resnet-preprocessed current
                frame, present only when opt.use_memory is set
        """
        A_path = self.A_paths[index]
        A_img = Image.open(A_path).convert('RGB')

        # Apply the same transform to the frame window and the resnet input.
        transform_params = get_params(self.opt, A_img.size)
        A_transform = get_transform(self.opt, transform_params, grayscale=(self.input_nc == 1), method=self.opt.resizemethod)
        A = A_transform(A_img)
        As = torch.zeros((self.input_nc * self.Nw, self.opt.crop_size, self.opt.crop_size))
        As[-self.input_nc:] = A
        # Frame number is the leading '_'-separated token of the basename,
        # e.g. "00012_blend.png" -> frame "00012".
        frame = os.path.basename(A_path).split('_')[0]
        frameno = int(frame)
        for i in range(1, self.Nw):
            # Read the frame i steps back and store it in slot Nw-1-i.
            path1 = A_path.replace(frame + '_blend', '%05d_blend' % (frameno - i))
            A = Image.open(path1).convert('RGB')
            As[-(i + 1) * self.input_nc:-i * self.input_nc] = A_transform(A)
        item = {'A': As, 'A_paths': A_path}

        if self.opt.use_memory:
            resnet_transform = get_transform(self.opt, transform_params, grayscale=False, resnet=True, method=self.opt.resizemethod)
            resnet_input = resnet_transform(A_img)
            item['resnet_input'] = resnet_input

        return item

    def __len__(self):
        """Return the total number of images in the dataset."""
        return len(self.A_paths)


class AlignedFeatureMultiDataset(Dataset):
    """A dataset class for paired image data with identity features.

    It assumes that the directory '/path/to/data/train' contains image pairs
    in the form of {A,B}. During test time, you need to prepare a directory
    '/path/to/data/test'. Paired A/B path lists are preferred when the files
    'datasets/list/<phase>A/<dataroot>.txt' and '.../<phase>B/...' exist.
    """

    def __init__(self, opt):
        """Initialize this dataset class.

        Parameters:
            opt (Option class) -- stores all the experiment flags; needs to be
                a subclass of BaseOptions
        """
        BaseDataset.__init__(self, opt)

        imglistA = 'datasets/list/%s/%s.txt' % (opt.phase + 'A', opt.dataroot)
        imglistB = 'datasets/list/%s/%s.txt' % (opt.phase + 'B', opt.dataroot)

        if not os.path.exists(imglistA) or not os.path.exists(imglistB):
            self.dir_AB = os.path.join(opt.dataroot, opt.phase)  # get the image directory
            self.AB_paths = sorted(make_dataset(self.dir_AB, opt.max_dataset_size))  # get image paths
        else:
            # BUG-FIX: close both list files via context managers (the
            # original leaked two open file handles).
            with open(imglistA, 'r') as fa:
                self.AB_paths = fa.read().splitlines()
            with open(imglistB, 'r') as fb:
                self.AB_paths2 = fb.read().splitlines()

        assert(self.opt.load_size >= self.opt.crop_size)  # crop_size should be smaller than the size of loaded image
        self.input_nc = self.opt.output_nc if self.opt.direction == 'BtoA' else self.opt.input_nc
        self.output_nc = self.opt.input_nc if self.opt.direction == 'BtoA' else self.opt.output_nc
        self.Nw = self.opt.Nw  # number of frames stacked per sample

    def __getitem__(self, index):
        """Return a data point and its metadata information.

        Parameters:
            index -- a random integer for data indexing

        Returns a dictionary that contains:
            A (tensor) -- Nw input-domain frames stacked channel-wise, the
                current frame last
            B (tensor) -- corresponding target-domain image
            A_paths (str) -- input image path
            B_paths (str) -- target image path
            resnet_input (tensor) -- resnet-preprocessed current input frame
            index (float32) -- the sample index as a scalar
            B_feat (ndarray, optional) -- identity feature for B, present when
                training or when opt.test_use_gt is set
        """
        # read a image given a random integer index
        # by default A and B are from 2 png
        AB_path = self.AB_paths[index]
        A = Image.open(AB_path).convert('RGB')
        AB_path2 = self.AB_paths2[index]
        B = Image.open(AB_path2).convert('RGB')

        # apply the same transform to both A and B
        transform_params = get_params(self.opt, A.size)
        A_transform = get_transform(self.opt, transform_params, grayscale=(self.input_nc == 1), method=self.opt.resizemethod)
        B_transform = get_transform(self.opt, transform_params, grayscale=(self.output_nc == 1), method=self.opt.resizemethod)
        resnet_transform = get_transform(self.opt, transform_params, grayscale=False, resnet=True, method=self.opt.resizemethod)

        imA = A
        A = A_transform(A)
        B = B_transform(B)
        resnet_input = resnet_transform(imA)

        # Stack the current frame plus the Nw-1 preceding frames; the current
        # frame occupies the last input_nc channels.
        As = torch.zeros((self.input_nc * self.Nw, self.opt.crop_size, self.opt.crop_size))
        As[-self.input_nc:] = A
        # Basename token like "frame123_..." -> frame number 123.
        frame = os.path.basename(AB_path).split('_')[0]
        frameno = int(frame[5:])
        for i in range(1, self.Nw):
            # read the frame i steps back and store it in slot Nw-1-i
            path1 = AB_path.replace(frame, 'frame%d' % (frameno - i))
            A = Image.open(path1).convert('RGB')
            As[-(i + 1) * self.input_nc:-i * self.input_nc] = A_transform(A)

        item = {'A': As, 'B': B, 'A_paths': AB_path, 'B_paths': AB_path2}
        item['resnet_input'] = resnet_input
        item['index'] = np.array(([index + 0.0])).astype(np.float32)[0]

        if self.opt.isTrain or self.opt.test_use_gt:
            # Identity features live next to the B images but under
            # opt.iden_feat_dir; the path layout differs per dataroot.
            AB_path2 = AB_path2.replace('_input2', '')
            ss = AB_path2.split('/')
            if self.opt.dataroot != '300vw_win3' and self.opt.dataroot != 'lrwnewrender_win3' and ss[-3] != '19_news':
                B_feat = np.load(os.path.join(self.opt.iden_feat_dir, ss[-2], ss[-1][:-4] + '.npy'))
            elif self.opt.dataroot == '300vw_win3':
                B_feat = np.load(os.path.join(self.opt.iden_feat_dir, ss[-3], ss[-2], ss[-1][:-4] + '.npy'))
            elif self.opt.dataroot == 'lrwnewrender_win3':
                # NOTE(review): this dataroot always loads the fixed
                # 'frame14.npy' feature — presumably one identity feature per
                # clip; confirm against the feature-extraction pipeline.
                B_feat = np.load(os.path.join(self.opt.iden_feat_dir, ss[-4], ss[-3], ss[-2], 'frame14.npy'))
            elif ss[-3] == '19_news':
                B_feat = np.load(os.path.join(self.opt.iden_feat_dir, ss[-3], ss[-2], ss[-1][:-4] + '.npy'))
            item['B_feat'] = B_feat

        return item

    def __len__(self):
        """Return the total number of images in the dataset."""
        return len(self.AB_paths)
Loading