FaceForensics++数据集处理

款姥爷

已于 2024-06-17 16:02:27 修改

阅读量995

点赞数 10

文章标签：人工智能算法机器学习

于 2024-06-17 15:59:12 首次发布

本文链接：https://blog.csdn.net/weixin_45640448/article/details/139746232

版权

这篇文章是对官方的数据集分成train、test、val的脚本。
纯原创，可能有些部分比较繁琐，大佬们嘴下留情。

一共分两部分，对真视频的处理脚本和对假视频的处理脚本

首先

将官方给的三个json保存到相应目录里。
官网地址：GitCode - 全球开发者的开源社区,开源代码托管平台

接下来

对真视频的处理：需要改的地方就是你的数据集地址以及处理之后的地址。

import os
import json
import shutil

with open('test.json', 'r', encoding='utf-8') as f_test:
    data_test = json.load(f_test)
with open('train.json', 'r', encoding='utf-8') as f_train:
    data_train = json.load(f_train)
with open('val.json', 'r', encoding='utf-8') as f_val:
    data_val = json.load(f_val)

source_folder = '/FaceForensics++/C40/original_sequences/youtube/c40/videos'
test_target_folder = '/FaceForensics++/C40/deelvideo/true/test/videos'
train_target_folder = '/FaceForensics++/C40/deelvideo/true/train/videos'
val_target_folder = '/FaceForensics++/C40/deelvideo/true/val/videos'

if not os.path.exists(test_target_folder):
    os.makedirs(test_target_folder)

for item in data_test:
    for i in item:
        file_name = f"{i}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(test_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)

if not os.path.exists(train_target_folder):
    os.makedirs(train_target_folder)

for item in data_train:
    for i in item:
        file_name = f"{i}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(train_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)

if not os.path.exists(val_target_folder):
    os.makedirs(val_target_folder)

for item in data_val:
    for i in item:
        file_name = f"{i}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(val_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)

然后

对假视频的处理：同样要去修改source_folder、test_target_folder、train_target_folder、val_target_folder这三个地址，不过这里需要对每个操作方法都要重新修改一下地址，这里我没做一个遍历，只能手动改一下了。例如：/FaceForensics++/C40/manipulated_sequences/NeuralTextures/c40/videos，这个地址是对NeuralTextures进行的处理，处理完修改地址中的NeuralTextures改成Deepfakes就可以了。

import os
import json
import shutil

with open('test.json', 'r', encoding='utf-8') as f_test:
    data_test = json.load(f_test)
with open('train.json', 'r', encoding='utf-8') as f_train:
    data_train = json.load(f_train)
with open('val.json', 'r', encoding='utf-8') as f_val:
    data_val = json.load(f_val)

source_folder = '/FaceForensics++/C40/manipulated_sequences/NeuralTextures/c40/videos'
test_target_folder = '/FaceForensics++/C40/deelvideo/false/NeuralTextures/test/videos'
train_target_folder = '/FaceForensics++/C40/deelvideo/false/NeuralTextures/train/videos'
val_target_folder = '/FaceForensics++/C40/deelvideo/false/NeuralTextures/val/videos'

if not os.path.exists(test_target_folder):
    os.makedirs(test_target_folder)

for item in data_test:
    num = 0
    for i in item:
        file_name = f"{item[num]}_{item[1-num]}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(test_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)
        num = num + 1

if not os.path.exists(train_target_folder):
    os.makedirs(train_target_folder)

for item in data_train:
    num = 0
    for i in item:
        file_name = f"{item[num]}_{item[1-num]}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(train_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)
        num = num + 1

if not os.path.exists(val_target_folder):
    os.makedirs(val_target_folder)

for item in data_val:
    num = 0
    for i in item:
        file_name = f"{item[num]}_{item[1-num]}.mp4"
        source_file_path = os.path.join(source_folder, file_name)
        target_file_path = os.path.join(val_target_folder, file_name)
        if os.path.exists(source_file_path):
            shutil.copy(source_file_path, target_file_path)
        num = num + 1