faceswap/scripts/convert.py at master · ag-python/faceswap

History

1198 lines (1021 loc) · 48.5 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

329

330

331

332

333

334

335

336

337

338

339

340

341

342

343

344

345

346

347

348

349

350

351

352

353

354

355

356

357

358

359

360

361

362

363

364

365

366

367

368

369

370

371

372

373

374

375

376

377

378

379

380

381

382

383

384

385

386

387

388

389

390

391

392

393

394

395

396

397

398

399

400

401

402

403

404

405

406

407

408

409

410

411

412

413

414

415

416

417

418

419

420

421

422

423

424

425

426

427

428

429

430

431

432

433

434

435

436

437

438

439

440

441

442

443

444

445

446

447

448

449

450

451

452

453

454

455

456

457

458

459

460

461

462

463

464

465

466

467

468

469

470

471

472

473

474

475

476

477

478

479

480

481

482

483

484

485

486

487

488

489

490

491

492

493

494

495

496

497

498

499

500

501

502

503

504

505

506

507

508

509

510

511

512

513

514

515

516

517

518

519

520

521

522

523

524

525

526

527

528

529

530

531

532

533

534

535

536

537

538

539

540

541

542

543

544

545

546

547

548

549

550

551

552

553

554

555

556

557

558

559

560

561

562

563

564

565

566

567

568

569

570

571

572

573

574

575

576

577

578

579

580

581

582

583

584

585

586

587

588

589

590

591

592

593

594

595

596

597

598

599

600

601

602

603

604

605

606

607

608

609

610

611

612

613

614

615

616

617

618

619

620

621

622

623

624

625

626

627

628

629

630

631

632

633

634

635

636

637

638

639

640

641

642

643

644

645

646

647

648

649

650

651

652

653

654

655

656

657

658

659

660

661

662

663

664

665

666

667

668

669

670

671

672

673

674

675

676

677

678

679

680

681

682

683

684

685

686

687

688

689

690

691

692

693

694

695

696

697

698

699

700

701

702

703

704

705

706

707

708

709

710

711

712

713

714

715

716

717

718

719

720

721

722

723

724

725

726

727

728

729

730

731

732

733

734

735

736

737

738

739

740

741

742

743

744

745

746

747

748

749

750

751

752

753

754

755

756

757

758

759

760

761

762

763

764

765

766

767

768

769

770

771

772

773

774

775

776

777

778

779

780

781

782

783

784

785

786

787

788

789

790

791

792

793

794

795

796

797

798

799

800

801

802

803

804

805

806

807

808

809

810

811

812

813

814

815

816

817

818

819

820

821

822

823

824

825

826

827

828

829

830

831

832

833

834

835

836

837

838

839

840

841

842

843

844

845

846

847

848

849

850

851

852

853

854

855

856

857

858

859

860

861

862

863

864

865

866

867

868

869

870

871

872

873

874

875

876

877

878

879

880

881

882

883

884

885

886

887

888

889

890

891

892

893

894

895

896

897

898

899

900

901

902

903

904

905

906

907

908

909

910

911

912

913

914

915

916

917

918

919

920

921

922

923

924

925

926

927

928

929

930

931

932

933

934

935

936

937

938

939

940

941

942

943

944

945

946

947

948

949

950

951

952

953

954

955

956

957

958

959

960

961

962

963

964

965

966

967

968

969

970

971

972

973

974

975

976

977

978

979

980

981

982

983

984

985

986

987

988

989

990

991

992

993

994

995

996

997

998

999

1000

#!/usr/bin python3

""" Main entry point to the convert process of FaceSwap """

from __future__ import annotations

from dataclasses import dataclass, field

import logging

import re

import os

import sys

import typing as T

from threading import Event

from time import sleep

import cv2

import numpy as np

from tqdm import tqdm

from scripts.fsmedia import Alignments, PostProcess, finalize

from lib.serializer import get_serializer

from lib.convert import Converter

from lib.align import AlignedFace, DetectedFace, update_legacy_png_header

from lib.gpu_stats import GPUStats

from lib.image import read_image_meta_batch, ImagesLoader

from lib.multithreading import MultiThread, total_cpus

from lib.queue_manager import queue_manager

from lib.utils import FaceswapError, get_folder, get_image_paths, handle_deprecated_cliopts

from plugins.extract import ExtractMedia, Extractor

from plugins.plugin_loader import PluginLoader

if T.TYPE_CHECKING:

from argparse import Namespace

from collections.abc import Callable

from plugins.convert.writer._base import Output

from plugins.train.model._base import ModelBase

from lib.align.aligned_face import CenteringType

from lib.queue_manager import EventQueue

logger = logging.getLogger(__name__)

@dataclass

class ConvertItem:

""" A single frame with associated objects passing through the convert process.

Parameters

----------

input: :class:`~plugins.extract.extract_media.ExtractMedia`

The ExtractMedia object holding the :attr:`filename`, :attr:`image` and attr:`list` of

:class:`~lib.align.DetectedFace` objects loaded from disk

feed_faces: list, Optional

list of :class:`lib.align.AlignedFace` objects for feeding into the model's predict

function

reference_faces: list, Optional

list of :class:`lib.align.AlignedFace` objects at model output sized for using as reference

in the convert functionfor feeding into the model's predict

swapped_faces: :class:`np.ndarray`

The swapped faces returned from the model's predict function

"""

inbound: ExtractMedia

feed_faces: list[AlignedFace] = field(default_factory=list)

reference_faces: list[AlignedFace] = field(default_factory=list)

swapped_faces: np.ndarray = np.array([])

class Convert():

""" The Faceswap Face Conversion Process.

The conversion process is responsible for swapping the faces on source frames with the output

from a trained model.

It leverages a series of user selected post-processing plugins, executed from

:class:`lib.convert.Converter`.

The convert process is self contained and should not be referenced by any other scripts, so it

contains no public properties.

Parameters

----------

arguments: :class:`argparse.Namespace`

The arguments to be passed to the convert process as generated from Faceswap's command

line arguments

"""

def __init__(self, arguments: Namespace) -> None:

logger.debug("Initializing %s: (args: %s)", self.__class__.__name__, arguments)

self._args = handle_deprecated_cliopts(arguments)

self._images = ImagesLoader(self._args.input_dir, fast_count=True)

self._alignments = self._get_alignments()

self._opts = OptionalActions(self._args, self._images.file_list, self._alignments)

self._add_queues()

self._predictor = Predict(self._queue_size, arguments)

self._disk_io = DiskIO(self._alignments, self._images, self._predictor, arguments)

self._predictor.launch(self._disk_io.load_queue)

self._validate()

get_folder(self._args.output_dir)

configfile = self._args.configfile if hasattr(self._args, "configfile") else None

self._converter = Converter(self._predictor.output_size,

self._predictor.coverage_ratio,

self._predictor.centering,

self._disk_io.draw_transparent,

self._disk_io.pre_encode,

arguments,

configfile=configfile)

self._patch_threads = self._get_threads()

logger.debug("Initialized %s", self.__class__.__name__)

@property

def _queue_size(self) -> int:

""" int: Size of the converter queues. 2 for single process otherwise 4 """

retval = 2 if self._args.singleprocess or self._args.jobs == 1 else 4

logger.debug(retval)

return retval

@property

def _pool_processes(self) -> int:

""" int: The number of threads to run in parallel. Based on user options and number of

available processors. """

if self._args.singleprocess:

retval = 1

elif self._args.jobs > 0:

retval = min(self._args.jobs, total_cpus(), self._images.count)

else:

retval = min(total_cpus(), self._images.count)

retval = 1 if retval == 0 else retval

logger.debug(retval)

return retval

def _get_alignments(self) -> Alignments:

""" Perform validation checks and legacy updates and return alignemnts object

Returns

-------

:class:`~lib.align.alignments.Alignments`

The alignments file for the extract job

"""

retval = Alignments(self._args, False, self._images.is_video)

if retval.version == 1.0:

logger.error("The alignments file format has been updated since the given alignments "

"file was generated. You need to update the file to proceed.")

logger.error("To do this run the 'Alignments Tool' > 'Extract' Job.")

sys.exit(1)

retval.update_legacy_has_source(os.path.basename(self._args.input_dir))

return retval

def _validate(self) -> None:

""" Validate the Command Line Options.

Ensure that certain cli selections are valid and won't result in an error. Checks:

* If frames have been passed in with video output, ensure user supplies reference

video.

* If "on-the-fly" and a Neural Network mask is selected, warn and switch to 'extended'

* If a mask-type is selected, ensure it exists in the alignments file.

* If a predicted mask-type is selected, ensure model has been trained with a mask

otherwise attempt to select first available masks, otherwise raise error.

Raises

------

FaceswapError

If an invalid selection has been found.

"""

if (self._args.writer == "ffmpeg" and

not self._images.is_video and

self._args.reference_video is None):

raise FaceswapError("Output as video selected, but using frames as input. You must "

"provide a reference video ('-ref', '--reference-video').")

if (self._args.on_the_fly and

self._args.mask_type not in ("none", "extended", "components")):

logger.warning("You have selected an incompatible mask type ('%s') for On-The-Fly "

"conversion. Switching to 'extended'", self._args.mask_type)

self._args.mask_type = "extended"

if (not self._args.on_the_fly and

self._args.mask_type not in ("none", "predicted") and

not self._alignments.mask_is_valid(self._args.mask_type)):

msg = (f"You have selected the Mask Type `{self._args.mask_type}` but at least one "

"face does not have this mask stored in the Alignments File.\nYou should "

"generate the required masks with the Mask Tool or set the Mask Type option to "

"an existing Mask Type.\nA summary of existing masks is as follows:\nTotal "

f"faces: {self._alignments.faces_count}, "

f"Masks: {self._alignments.mask_summary}")

raise FaceswapError(msg)

if self._args.mask_type == "predicted" and not self._predictor.has_predicted_mask:

available_masks = [k for k, v in self._alignments.mask_summary.items()

if k != "none" and v == self._alignments.faces_count]

if not available_masks:

msg = ("Predicted Mask selected, but the model was not trained with a mask and no "

"masks are stored in the Alignments File.\nYou should generate the "

"required masks with the Mask Tool or set the Mask Type to `none`.")

raise FaceswapError(msg)

mask_type = available_masks[0]

logger.warning("Predicted Mask selected, but the model was not trained with a "

"mask. Selecting first available mask: '%s'", mask_type)

self._args.mask_type = mask_type

def _add_queues(self) -> None:

""" Add the queues for in, patch and out. """

logger.debug("Adding queues. Queue size: %s", self._queue_size)

for qname in ("convert_in", "convert_out", "patch"):

queue_manager.add_queue(qname, self._queue_size)

def _get_threads(self) -> MultiThread:

""" Get the threads for patching the converted faces onto the frames.

Returns

:class:`lib.multithreading.MultiThread`

The threads that perform the patching of swapped faces onto the output frames

"""

save_queue = queue_manager.get_queue("convert_out")

patch_queue = queue_manager.get_queue("patch")

return MultiThread(self._converter.process, patch_queue, save_queue,

thread_count=self._pool_processes, name="patch")

def process(self) -> None:

""" The entry point for triggering the Conversion Process.

Should only be called from :class:`lib.cli.launcher.ScriptExecutor`

Raises

------

FaceswapError

Error raised if the process runs out of memory

"""

logger.debug("Starting Conversion")

# queue_manager.debug_monitor(5)

try:

self._convert_images()

self._disk_io.save_thread.join()

queue_manager.terminate_queues()

finalize(self._images.count,

self._predictor.faces_count,

self._predictor.verify_output)

logger.debug("Completed Conversion")

except MemoryError as err:

msg = ("Faceswap ran out of RAM running convert. Conversion is very system RAM "

"heavy, so this can happen in certain circumstances when you have a lot of "

"cpus but not enough RAM to support them all."

"\nYou should lower the number of processes in use by either setting the "

"'singleprocess' flag (-sp) or lowering the number of parallel jobs (-j).")

raise FaceswapError(msg) from err

def _convert_images(self) -> None:

""" Start the multi-threaded patching process, monitor all threads for errors and join on

completion. """

logger.debug("Converting images")

self._patch_threads.start()

while True:

self._check_thread_error()

if self._disk_io.completion_event.is_set():

logger.debug("DiskIO completion event set. Joining Pool")

break

if self._patch_threads.completed():

logger.debug("All patch threads completed")

break

sleep(1)

self._patch_threads.join()

logger.debug("Putting EOF")

queue_manager.get_queue("convert_out").put("EOF")

logger.debug("Converted images")

def _check_thread_error(self) -> None:

""" Monitor all running threads for errors, and raise accordingly.

Raises

------

Error

Re-raises any error encountered within any of the running threads

"""

for thread in (self._predictor.thread,

self._disk_io.load_thread,

self._disk_io.save_thread,

self._patch_threads):

thread.check_and_raise_error()

class DiskIO():

""" Disk Input/Output for the converter process.

Background threads to:

* Load images from disk and get the detected faces

* Save images back to disk

Parameters

----------

alignments: :class:`lib.alignmnents.Alignments`

The alignments for the input video

images: :class:`lib.image.ImagesLoader`

The input images

predictor: :class:`Predict`

The object for generating predictions from the model

arguments: :class:`argparse.Namespace`

The arguments that were passed to the convert process as generated from Faceswap's command

line arguments

"""

def __init__(self,

alignments: Alignments,

images: ImagesLoader,

predictor: Predict,

arguments: Namespace) -> None:

logger.debug("Initializing %s: (alignments: %s, images: %s, predictor: %s, arguments: %s)",

self.__class__.__name__, alignments, images, predictor, arguments)

self._alignments = alignments

self._images = images

self._args = arguments

self._pre_process = PostProcess(arguments)

self._completion_event = Event()

# For frame skipping

self._imageidxre = re.compile(r"(\d+)(?!.*\d\.)(?=\.\w+$)")

self._frame_ranges = self._get_frame_ranges()

self._writer = self._get_writer(predictor)

# Extractor for on the fly detection

self._extractor = self._load_extractor()

self._queues: dict[T.Literal["load", "save"], EventQueue] = {}

self._threads: dict[T.Literal["load", "save"], MultiThread] = {}

self._init_threads()

logger.debug("Initialized %s", self.__class__.__name__)

@property

def completion_event(self) -> Event:

""" :class:`event.Event`: Event is set when the DiskIO Save task is complete """

return self._completion_event

@property

def draw_transparent(self) -> bool:

""" bool: ``True`` if the selected writer's Draw_transparent configuration item is set

otherwise ``False`` """

return self._writer.config.get("draw_transparent", False)

@property

def pre_encode(self) -> Callable[[np.ndarray, T.Any], list[bytes]] | None:

""" python function: Selected writer's pre-encode function, if it has one,

otherwise ``None`` """

dummy = np.zeros((20, 20, 3), dtype="uint8")

test = self._writer.pre_encode(dummy)

retval: Callable | None = None if test is None else self._writer.pre_encode

logger.debug("Writer pre_encode function: %s", retval)

return retval

@property

def save_thread(self) -> MultiThread:

""" :class:`lib.multithreading.MultiThread`: The thread that is running the image writing

operation. """

return self._threads["save"]

@property

def load_thread(self) -> MultiThread:

""" :class:`lib.multithreading.MultiThread`: The thread that is running the image loading

operation. """

return self._threads["load"]

@property

def load_queue(self) -> EventQueue:

""" :class:`~lib.queue_manager.EventQueue`: The queue that images and detected faces are "

"loaded into. """

return self._queues["load"]

@property

def _total_count(self) -> int:

""" int: The total number of frames to be converted """

if self._frame_ranges and not self._args.keep_unchanged:

retval = sum(fr[1] - fr[0] + 1 for fr in self._frame_ranges)

else:

retval = self._images.count

logger.debug(retval)

return retval

# Initialization

def _get_writer(self, predictor: Predict) -> Output:

""" Load the selected writer plugin.

Parameters

----------

predictor: :class:`Predict`

The object for generating predictions from the model

Returns

-------

:mod:`plugins.convert.writer` plugin

The requested writer plugin

"""

args = [self._args.output_dir]

if self._args.writer in ("ffmpeg", "gif"):

args.extend([self._total_count, self._frame_ranges])

if self._args.writer == "ffmpeg":

if self._images.is_video:

args.append(self._args.input_dir)

else:

args.append(self._args.reference_video)

if self._args.writer == "patch":

args.append(predictor.output_size)

logger.debug("Writer args: %s", args)

configfile = self._args.configfile if hasattr(self._args, "configfile") else None

return PluginLoader.get_converter("writer", self._args.writer)(*args,

configfile=configfile)

def _get_frame_ranges(self) -> list[tuple[int, int]] | None:

""" Obtain the frame ranges that are to be converted.

If frame ranges have been specified, then split the command line formatted arguments into

ranges that can be used.

Returns

list or ``None``

A list of frames to be processed, or ``None`` if the command line argument was not

used

"""

if not self._args.frame_ranges:

logger.debug("No frame range set")

return None

minframe, maxframe = None, None

if self._images.is_video:

minframe, maxframe = 1, self._images.count

else:

indices = [int(self._imageidxre.findall(os.path.basename(filename))[0])

for filename in self._images.file_list]

if indices:

minframe, maxframe = min(indices), max(indices)

logger.debug("minframe: %s, maxframe: %s", minframe, maxframe)

if minframe is None or maxframe is None:

raise FaceswapError("Frame Ranges specified, but could not determine frame numbering "

"from filenames")

retval = []

for rng in self._args.frame_ranges:

if "-" not in rng:

raise FaceswapError("Frame Ranges not specified in the correct format")

start, end = rng.split("-")

retval.append((max(int(start), minframe), min(int(end), maxframe)))

logger.debug("frame ranges: %s", retval)

return retval

def _load_extractor(self) -> Extractor | None:

""" Load the CV2-DNN Face Extractor Chain.

For On-The-Fly conversion we use a CPU based extractor to avoid stacking the GPU.

Results are poor.

Returns

-------

:class:`plugins.extract.Pipeline.Extractor`

The face extraction chain to be used for on-the-fly conversion

"""

if not self._alignments.have_alignments_file and not self._args.on_the_fly:

logger.error("No alignments file found. Please provide an alignments file for your "

"destination video (recommended) or enable on-the-fly conversion (not "

"recommended).")

sys.exit(1)

if self._alignments.have_alignments_file:

if self._args.on_the_fly:

logger.info("On-The-Fly conversion selected, but an alignments file was found. "

"Using pre-existing alignments file: '%s'", self._alignments.file)

else:

logger.debug("Alignments file found: '%s'", self._alignments.file)

return None

logger.debug("Loading extractor")

logger.warning("On-The-Fly conversion selected. This will use the inferior cv2-dnn for "

"extraction and will produce poor results.")

logger.warning("It is recommended to generate an alignments file for your destination "

"video with Extract first for superior results.")

extractor = Extractor(detector="cv2-dnn",

aligner="cv2-dnn",

masker=self._args.mask_type,

multiprocess=True,

rotate_images=None,

min_size=20)

extractor.launch()

logger.debug("Loaded extractor")

return extractor

def _init_threads(self) -> None:

""" Initialize queues and threads.

Creates the load and save queues and the load and save threads. Starts the threads.

"""

logger.debug("Initializing DiskIO Threads")

for task in T.get_args(T.Literal["load", "save"]):

self._add_queue(task)

self._start_thread(task)

logger.debug("Initialized DiskIO Threads")

def _add_queue(self, task: T.Literal["load", "save"]) -> None:

""" Add the queue to queue_manager and to :attr:`self._queues` for the given task.

Parameters

----------

task: {"load", "save"}

The task that the queue is to be added for

"""

logger.debug("Adding queue for task: '%s'", task)

if task == "load":

q_name = "convert_in"

elif task == "save":

q_name = "convert_out"

else:

q_name = task

self._queues[task] = queue_manager.get_queue(q_name)

logger.debug("Added queue for task: '%s'", task)

def _start_thread(self, task: T.Literal["load", "save"]) -> None:

""" Create the thread for the given task, add it it :attr:`self._threads` and start it.

Parameters

----------

task: {"load", "save"}

The task that the thread is to be created for

"""

logger.debug("Starting thread: '%s'", task)

args = self._completion_event if task == "save" else None

func = getattr(self, f"_{task}")

io_thread = MultiThread(func, args, thread_count=1)

io_thread.start()

self._threads[task] = io_thread

logger.debug("Started thread: '%s'", task)

# Loading tasks

def _load(self, *args) -> None: # pylint:disable=unused-argument

""" Load frames from disk.

In a background thread:

* Loads frames from disk.

* Discards or passes through cli selected skipped frames

* Pairs the frame with its :class:`~lib.align.DetectedFace` objects

* Performs any pre-processing actions

* Puts the frame and detected faces to the load queue

"""

logger.debug("Load Images: Start")

idx = 0

for filename, image in self._images.load():

idx += 1

if self._queues["load"].shutdown.is_set():

logger.debug("Load Queue: Stop signal received. Terminating")

break

if image is None or (not image.any() and image.ndim not in (2, 3)):

# All black frames will return not numpy.any() so check dims too

logger.warning("Unable to open image. Skipping: '%s'", filename)

continue

if self._check_skipframe(filename):

if self._args.keep_unchanged:

logger.trace("Saving unchanged frame: %s", filename) # type:ignore

out_file = os.path.join(self._args.output_dir, os.path.basename(filename))

self._queues["save"].put((out_file, image))

else:

logger.trace("Discarding frame: '%s'", filename) # type:ignore

continue

detected_faces = self._get_detected_faces(filename, image)

item = ConvertItem(ExtractMedia(filename, image, detected_faces))

self._pre_process.do_actions(item.inbound)

self._queues["load"].put(item)

logger.debug("Putting EOF")

self._queues["load"].put("EOF")

logger.debug("Load Images: Complete")

def _check_skipframe(self, filename: str) -> bool:

""" Check whether a frame is to be skipped.

Parameters

----------

filename: str

The filename of the frame to check

Returns

-------

bool

``True`` if the frame is to be skipped otherwise ``False``

"""

if not self._frame_ranges:

return False

indices = self._imageidxre.findall(filename)

if not indices:

logger.warning("Could not determine frame number. Frame will be converted: '%s'",

filename)

return False

idx = int(indices[0])

skipframe = not any(map(lambda b: b[0] <= idx <= b[1], self._frame_ranges))

logger.trace("idx: %s, skipframe: %s", idx, skipframe) # type: ignore[attr-defined]

return skipframe

def _get_detected_faces(self, filename: str, image: np.ndarray) -> list[DetectedFace]:

""" Return the detected faces for the given image.

If we have an alignments file, then the detected faces are created from that file. If

we're running On-The-Fly then they will be extracted from the extractor.

Parameters

----------

filename: str

The filename to return the detected faces for

image: :class:`numpy.ndarray`

The frame that the detected faces exist in

Returns

-------

list

List of :class:`lib.align.DetectedFace` objects

"""

logger.trace("Getting faces for: '%s'", filename) # type:ignore

if not self._extractor:

detected_faces = self._alignments_faces(os.path.basename(filename), image)

else:

detected_faces = self._detect_faces(filename, image)

logger.trace("Got %s faces for: '%s'", len(detected_faces), filename) # type:ignore

return detected_faces

def _alignments_faces(self, frame_name: str, image: np.ndarray) -> list[DetectedFace]:

""" Return detected faces from an alignments file.

Parameters

----------

frame_name: str

The name of the frame to return the detected faces for

image: :class:`numpy.ndarray`

The frame that the detected faces exist in

Returns

-------

list

List of :class:`lib.align.DetectedFace` objects

"""

if not self._check_alignments(frame_name):

return []

faces = self._alignments.get_faces_in_frame(frame_name)

detected_faces = []

for rawface in faces:

face = DetectedFace()

face.from_alignment(rawface, image=image)

detected_faces.append(face)

return detected_faces

def _check_alignments(self, frame_name: str) -> bool:

""" Ensure that we have alignments for the current frame.

If we have no alignments for this image, skip it and output a message.

Parameters

----------

frame_name: str

The name of the frame to check that we have alignments for

Returns

-------

bool

``True`` if we have alignments for this face, otherwise ``False``

"""

have_alignments = self._alignments.frame_exists(frame_name)

if not have_alignments:

tqdm.write(f"No alignment found for {frame_name}, skipping")

return have_alignments

def _detect_faces(self, filename: str, image: np.ndarray) -> list[DetectedFace]:

""" Extract the face from a frame for On-The-Fly conversion.

Pulls detected faces out of the Extraction pipeline.

Parameters

----------

filename: str

The filename to return the detected faces for

image: :class:`numpy.ndarray`

The frame that the detected faces exist in

Returns

-------

list

List of :class:`lib.align.DetectedFace` objects

"""

assert self._extractor is not None

self._extractor.input_queue.put(ExtractMedia(filename, image))

faces = next(self._extractor.detected_faces())

return faces.detected_faces

# Saving tasks

def _save(self, completion_event: Event) -> None:

""" Save the converted images.

Puts the selected writer into a background thread and feeds it from the output of the

patch queue.

Parameters

----------

completion_event: :class:`event.Event`

An even that this process triggers when it has finished saving

"""

logger.debug("Save Images: Start")

write_preview = self._args.redirect_gui and self._writer.is_stream

preview_image = os.path.join(self._writer.output_folder, ".gui_preview.jpg")

logger.debug("Write preview for gui: %s", write_preview)

for idx in tqdm(range(self._total_count), desc="Converting", file=sys.stdout):

if self._queues["save"].shutdown.is_set():

logger.debug("Save Queue: Stop signal received. Terminating")

break

item: tuple[str, np.ndarray | bytes] | T.Literal["EOF"] = self._queues["save"].get()

if item == "EOF":

logger.debug("EOF Received")

break

filename, image = item

# Write out preview image for the GUI every 10 frames if writing to stream

if write_preview and idx % 10 == 0 and not os.path.exists(preview_image):

logger.debug("Writing GUI Preview image: '%s'", preview_image)

assert isinstance(image, np.ndarray)

cv2.imwrite(preview_image, image)

self._writer.write(filename, image)

self._writer.close()

completion_event.set()

logger.debug("Save Faces: Complete")

class Predict():

""" Obtains the output from the Faceswap model.

Parameters

----------

queue_size: int

The maximum size of the input queue

arguments: :class:`argparse.Namespace`

The arguments that were passed to the convert process as generated from Faceswap's command

line arguments

"""

def __init__(self, queue_size: int, arguments: Namespace) -> None:

logger.debug("Initializing %s: (args: %s, queue_size: %s)",

self.__class__.__name__, arguments, queue_size)

self._args = arguments

self._in_queue: EventQueue | None = None

self._out_queue = queue_manager.get_queue("patch")

self._serializer = get_serializer("json")

self._faces_count = 0

self._verify_output = False

self._model = self._load_model()

self._batchsize = self._get_batchsize(queue_size)

self._sizes = self._get_io_sizes()

self._coverage_ratio = self._model.coverage_ratio

self._centering = self._model.config["centering"]

self._thread: MultiThread | None = None

logger.debug("Initialized %s: (out_queue: %s)", self.__class__.__name__, self._out_queue)

@property

def thread(self) -> MultiThread:

""" :class:`~lib.multithreading.MultiThread`: The thread that is running the prediction

function from the Faceswap model. """

assert self._thread is not None

return self._thread

@property

def in_queue(self) -> EventQueue:

""" :class:`~lib.queue_manager.EventQueue`: The input queue to the predictor. """

assert self._in_queue is not None

return self._in_queue

@property

def out_queue(self) -> EventQueue:

""" :class:`~lib.queue_manager.EventQueue`: The output queue from the predictor. """

return self._out_queue

@property

def faces_count(self) -> int:

""" int: The total number of faces seen by the Predictor. """

return self._faces_count

@property

def verify_output(self) -> bool:

""" bool: ``True`` if multiple faces have been found in frames, otherwise ``False``. """

return self._verify_output

@property

def coverage_ratio(self) -> float:

""" float: The coverage ratio that the model was trained at. """

return self._coverage_ratio

@property

def centering(self) -> CenteringType:

""" str: The centering that the model was trained on (`"head", "face"` or `"legacy"`) """

return self._centering

@property

def has_predicted_mask(self) -> bool:

""" bool: ``True`` if the model was trained to learn a mask, otherwise ``False``. """

return bool(self._model.config.get("learn_mask", False))

@property

def output_size(self) -> int:

""" int: The size in pixels of the Faceswap model output. """

return self._sizes["output"]

def _get_io_sizes(self) -> dict[str, int]:

""" Obtain the input size and output size of the model.

Returns

-------

dict

input_size in pixels and output_size in pixels

"""

input_shape = self._model.model.input_shape

input_shape = [input_shape] if not isinstance(input_shape, list) else input_shape

output_shape = self._model.model.output_shape

output_shape = [output_shape] if not isinstance(output_shape, list) else output_shape

retval = {"input": input_shape[0][1], "output": output_shape[-1][1]}

logger.debug(retval)

return retval

def _load_model(self) -> ModelBase:

""" Load the Faceswap model.

Returns

-------

:mod:`plugins.train.model` plugin

The trained model in the specified model folder

"""

logger.debug("Loading Model")

model_dir = get_folder(self._args.model_dir, make_folder=False)

if not model_dir:

raise FaceswapError(f"{self._args.model_dir} does not exist.")

trainer = self._get_model_name(model_dir)

model = PluginLoader.get_model(trainer)(model_dir, self._args, predict=True)

model.build()

logger.debug("Loaded Model")

return model

def _get_batchsize(self, queue_size: int) -> int:

""" Get the batch size for feeding the model.

Sets the batch size to 1 if inference is being run on CPU, otherwise the minimum of the

input queue size and the model's `convert_batchsize` configuration option.

Parameters

----------

queue_size: int

The queue size that is feeding the predictor

Returns

-------

int

The batch size that the model is to be fed at.

"""

logger.debug("Getting batchsize")

is_cpu = GPUStats().device_count == 0

batchsize = 1 if is_cpu else self._model.config["convert_batchsize"]

batchsize = min(queue_size, batchsize)

logger.debug("Got batchsize: %s", batchsize)

return batchsize

def _get_model_name(self, model_dir: str) -> str:

""" Return the name of the Faceswap model used.

Retrieve the name of the model from the model's state file.

Parameters

----------

model_dir: str

The folder that contains the trained Faceswap model

Returns

-------

str

The name of the Faceswap model being used.

"""

statefiles = [fname for fname in os.listdir(str(model_dir))

if fname.endswith("_state.json")]

if len(statefiles) != 1:

raise FaceswapError("There should be 1 state file in your model folder. "

f"{len(statefiles)} were found.")

statefile = os.path.join(str(model_dir), statefiles[0])

state = self._serializer.load(statefile)

trainer = state.get("name", None)

if not trainer:

raise FaceswapError("Trainer name could not be read from state file.")

logger.debug("Trainer from state file: '%s'", trainer)

return trainer

def launch(self, load_queue: EventQueue) -> None:

""" Launch the prediction process in a background thread.

Starts the prediction thread and returns the thread.

Parameters

----------

load_queue: :class:`~lib.queue_manager.EventQueue`

The queue that contains images and detected faces for feeding the model

"""

self._in_queue = load_queue

self._thread = MultiThread(self._predict_faces, thread_count=1)

self._thread.start()

def _predict_faces(self) -> None:

""" Run Prediction on the Faceswap model in a background thread.

Reads from the :attr:`self._in_queue`, prepares images for prediction

then puts the predictions back to the :attr:`self.out_queue`

"""

faces_seen = 0

consecutive_no_faces = 0

batch: list[ConvertItem] = []

assert self._in_queue is not None

while True:

item: T.Literal["EOF"] | ConvertItem = self._in_queue.get()

if item == "EOF":

logger.debug("EOF Received")

if batch: # Process out any remaining items

self._process_batch(batch, faces_seen)

break

logger.trace("Got from queue: '%s'", item.inbound.filename) # type:ignore

faces_count = len(item.inbound.detected_faces)

# Safety measure. If a large stream of frames appear that do not have faces,

# these will stack up into RAM. Keep a count of consecutive frames with no faces.

# If self._batchsize number of frames appear, force the current batch through

# to clear RAM.

consecutive_no_faces = consecutive_no_faces + 1 if faces_count == 0 else 0

self._faces_count += faces_count

if faces_count > 1:

self._verify_output = True

logger.verbose("Found more than one face in an image! '%s'", # type:ignore

os.path.basename(item.inbound.filename))

self.load_aligned(item)

faces_seen += faces_count

batch.append(item)

if faces_seen < self._batchsize and consecutive_no_faces < self._batchsize:

logger.trace("Continuing. Current batchsize: %s, " # type:ignore

"consecutive_no_faces: %s", faces_seen, consecutive_no_faces)

continue

self._process_batch(batch, faces_seen)

consecutive_no_faces = 0

faces_seen = 0

batch = []

logger.debug("Putting EOF")

self._out_queue.put("EOF")

logger.debug("Load queue complete")

def _process_batch(self, batch: list[ConvertItem], faces_seen: int):

""" Predict faces on the given batch of images and queue out to patch thread

Parameters

----------

batch: list

List of :class:`ConvertItem` objects for the current batch

faces_seen: int

The number of faces seen in the current batch

Returns

-------

:class:`np.narray`

The predicted faces for the current batch

"""

logger.trace("Batching to predictor. Frames: %s, Faces: %s", # type:ignore

len(batch), faces_seen)

feed_batch = [feed_face for item in batch for feed_face in item.feed_faces]

if faces_seen != 0:

feed_faces = self._compile_feed_faces(feed_batch)

batch_size = None

predicted = self._predict(feed_faces, batch_size)

else:

predicted = np.array([])

self._queue_out_frames(batch, predicted)

def load_aligned(self, item: ConvertItem) -> None:

""" Load the model's feed faces and the reference output faces.

For each detected face in the incoming item, load the feed face and reference face

images, correctly sized for input and output respectively.

Parameters

----------

item: :class:`ConvertMedia`

The convert media object, containing the ExctractMedia for the current image

"""

logger.trace("Loading aligned faces: '%s'", item.inbound.filename) # type:ignore

feed_faces = []

reference_faces = []

for detected_face in item.inbound.detected_faces:

feed_face = AlignedFace(detected_face.landmarks_xy,

image=item.inbound.image,

centering=self._centering,

View remainder of file in raw view

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

convert.py

Latest commit

History

convert.py

File metadata and controls