diff --git a/.flake8 b/.flake8 new file mode 100644 index 0000000000000000000000000000000000000000..4c9027e764444c3296a3c9aabf219a65cabe46bd --- /dev/null +++ b/.flake8 @@ -0,0 +1,3 @@ +[flake8] +select = E3, E4, F +per-file-ignores = roop/core.py:E402,F401 \ No newline at end of file diff --git a/.gitattributes b/.gitattributes index a6344aac8c09253b3b630fb776ae94478aa0275b..542a48fd52c6305ccd73639b58464b070bd5963c 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +.github/examples/snapshot.mp4 filter=lfs diff=lfs merge=lfs -text +.github/preview/output.gif filter=lfs diff=lfs merge=lfs -text +.github/preview/target.gif filter=lfs diff=lfs merge=lfs -text +uploads/1685074910001_vtqikl_2_0.jpg filter=lfs diff=lfs merge=lfs -text +uploads/20230518_174347_0000.png filter=lfs diff=lfs merge=lfs -text diff --git a/.github/FUNDING.yml b/.github/FUNDING.yml new file mode 100644 index 0000000000000000000000000000000000000000..a3f27d05ba7d8e7d8a025c372e4542e87861b7fb --- /dev/null +++ b/.github/FUNDING.yml @@ -0,0 +1,2 @@ +github: [s0md3v, henryruhs] +custom: [https://paypal.me/s0md3v, https://paypal.me/henryruhs] diff --git a/.github/ISSUE_TEMPLATE/bug.md b/.github/ISSUE_TEMPLATE/bug.md new file mode 100644 index 0000000000000000000000000000000000000000..a0f9c2ea981873f2462a95e1607c5674397c2f43 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/bug.md @@ -0,0 +1,47 @@ +--- +name: Bug +about: Report a bug +labels: 'bug' + +--- + +## Description + +A concise description of the bug and how to reproduce it. + +## Error + +Paste the error or exception from your console: + +``` + +``` + +## Details + +What operating system are you using? + +- [ ] Windows +- [ ] MacOS (Apple Silicon) +- [ ] MacOS (Apple Legacy) +- [ ] Linux +- [ ] Linux in WSL + +What execution provider are you using? 
+ +- [ ] CPU +- [ ] CUDA +- [ ] CoreML +- [ ] DirectML +- [ ] OpenVINO +- [ ] Other + +What version of Roop are you using? + +- [ ] 1.0.0 +- [ ] 1.1.0 +- [ ] 1.2.0 +- [ ] 1.3.0 +- [ ] 1.3.1 +- [ ] 1.3.2 +- [ ] next diff --git a/.github/ISSUE_TEMPLATE/installation.md b/.github/ISSUE_TEMPLATE/installation.md new file mode 100644 index 0000000000000000000000000000000000000000..5b1e96b04c98d16517505e7f2cd195a25c21a0d8 --- /dev/null +++ b/.github/ISSUE_TEMPLATE/installation.md @@ -0,0 +1,8 @@ +--- +name: Installation +about: Platform and installation issues +labels: 'installation' + +--- + +Please **DO NOT OPEN** platform and installation issues! diff --git a/.github/examples/snapshot.mp4 b/.github/examples/snapshot.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..dbf23f3278a97d4b936a67262777044c6670deb0 --- /dev/null +++ b/.github/examples/snapshot.mp4 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6021bee403a32b33b9d0b12916fcc40fee520681910a3faaef4b1f7e66ee386e +size 2435482 diff --git a/.github/examples/source.jpg b/.github/examples/source.jpg new file mode 100644 index 0000000000000000000000000000000000000000..bdaa5e4429625621de84f547fc5aca19cc26e2b8 Binary files /dev/null and b/.github/examples/source.jpg differ diff --git a/.github/examples/target.mp4 b/.github/examples/target.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..a8f3f6f27942c247a99e7a2372b45132ec7fa693 Binary files /dev/null and b/.github/examples/target.mp4 differ diff --git a/.github/preview/output.gif b/.github/preview/output.gif new file mode 100644 index 0000000000000000000000000000000000000000..cb1a320f03f2b1446096c52349fc92f8ec1fced9 --- /dev/null +++ b/.github/preview/output.gif @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49bf3696cd628b26a881571ca7e04f3256ba0378fc1c36991c55b49133d31dfd +size 3634769 diff --git a/.github/preview/target.gif b/.github/preview/target.gif new file mode 100644 index 
0000000000000000000000000000000000000000..36974a107b217024cde75bdbc9e76245012871b3 --- /dev/null +++ b/.github/preview/target.gif @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8bf5c612b2d4667c7a0274128bca561282e8ec349feff75fa691bb2580feefd +size 3296066 diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml new file mode 100644 index 0000000000000000000000000000000000000000..cefc64ffccc7250fa01a9931663e5dd98634a335 --- /dev/null +++ b/.github/workflows/ci.yml @@ -0,0 +1,41 @@ +name: ci + +on: [ push, pull_request ] + +jobs: + lint: + runs-on: ubuntu-latest + steps: + - name: Checkout + uses: actions/checkout@v2 + - name: Set up Python 3.9 + uses: actions/setup-python@v2 + with: + python-version: 3.9 + - run: pip install flake8 + - run: pip install mypy + - run: flake8 run.py roop + - run: mypy run.py roop + test: + strategy: + matrix: + os: [macos-latest, ubuntu-latest, windows-latest] + runs-on: ${{ matrix.os }} + steps: + - name: Checkout + uses: actions/checkout@v2 + - name: Set up ffmpeg + uses: FedericoCarboni/setup-ffmpeg@v2 + - name: Set up Python 3.9 + uses: actions/setup-python@v2 + with: + python-version: 3.9 + - run: pip install -r requirements-headless.txt + - run: python run.py -s .github/examples/source.jpg -t .github/examples/target.mp4 -o .github/examples/output.mp4 + if: matrix.os != 'windows-latest' + - run: python run.py -s .github\examples\source.jpg -t .github\examples\target.mp4 -o .github\examples\output.mp4 + if: matrix.os == 'windows-latest' + - run: ffmpeg -i .github/examples/snapshot.mp4 -i .github/examples/output.mp4 -filter_complex psnr -f null - + if: matrix.os != 'windows-latest' + - run: ffmpeg -i .github\examples\snapshot.mp4 -i .github\examples\output.mp4 -filter_complex psnr -f null - + if: matrix.os == 'windows-latest' diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000000000000000000000000000000000000..e25e7ce3b357ca8351e9cc14070959b4e63ed3d7 --- /dev/null +++ b/.gitignore 
@@ -0,0 +1,4 @@ +.idea +models +temp +__pycache__ diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md new file mode 100644 index 0000000000000000000000000000000000000000..da18ab471e305bae02a9216680110547a24e1790 --- /dev/null +++ b/CONTRIBUTING.md @@ -0,0 +1,25 @@ +## Pull Requests + +Before submitting a pull request, please make sure to align with us, as we need to establish both technical and business requirements. + + +### Do + +- ...consider fixing bugs over adding features +- ...one pull request for one feature or improvement +- ...consult us about implementation details +- ...proper testing before you submit your code +- ...resolve failed CI pipelines + + +### Don't + +- ...introduce fundamental changes in terms of software architecture +- ...introduce OOP - we accept functional programming only +- ...ignore given requirements or try to work around them +- ...submit code to a development branch without consulting us +- ...submit a massive amount of code changes +- ...submit a proof of concept +- ...submit code that is using undocumented and private APIs +- ...solve third-party issues in our project +- ...comment what your code does - use proper naming instead diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000000000000000000000000000000000000..f288702d2fa16d3cdf0035b15a9fcbc552cd88e7 --- /dev/null +++ b/LICENSE @@ -0,0 +1,674 @@ + GNU GENERAL PUBLIC LICENSE + Version 3, 29 June 2007 + + Copyright (C) 2007 Free Software Foundation, Inc. <https://fsf.org/> + Everyone is permitted to copy and distribute verbatim copies + of this license document, but changing it is not allowed. + + Preamble + + The GNU General Public License is a free, copyleft license for +software and other kinds of works. + + The licenses for most software and other practical works are designed +to take away your freedom to share and change the works. 
By contrast, +the GNU General Public License is intended to guarantee your freedom to +share and change all versions of a program--to make sure it remains free +software for all its users. We, the Free Software Foundation, use the +GNU General Public License for most of our software; it applies also to +any other work released this way by its authors. You can apply it to +your programs, too. + + When we speak of free software, we are referring to freedom, not +price. Our General Public Licenses are designed to make sure that you +have the freedom to distribute copies of free software (and charge for +them if you wish), that you receive source code or can get it if you +want it, that you can change the software or use pieces of it in new +free programs, and that you know you can do these things. + + To protect your rights, we need to prevent others from denying you +these rights or asking you to surrender the rights. Therefore, you have +certain responsibilities if you distribute copies of the software, or if +you modify it: responsibilities to respect the freedom of others. + + For example, if you distribute copies of such a program, whether +gratis or for a fee, you must pass on to the recipients the same +freedoms that you received. You must make sure that they, too, receive +or can get the source code. And you must show them these terms so they +know their rights. + + Developers that use the GNU GPL protect your rights with two steps: +(1) assert copyright on the software, and (2) offer you this License +giving you legal permission to copy, distribute and/or modify it. + + For the developers' and authors' protection, the GPL clearly explains +that there is no warranty for this free software. For both users' and +authors' sake, the GPL requires that modified versions be marked as +changed, so that their problems will not be attributed erroneously to +authors of previous versions. 
+ + Some devices are designed to deny users access to install or run +modified versions of the software inside them, although the manufacturer +can do so. This is fundamentally incompatible with the aim of +protecting users' freedom to change the software. The systematic +pattern of such abuse occurs in the area of products for individuals to +use, which is precisely where it is most unacceptable. Therefore, we +have designed this version of the GPL to prohibit the practice for those +products. If such problems arise substantially in other domains, we +stand ready to extend this provision to those domains in future versions +of the GPL, as needed to protect the freedom of users. + + Finally, every program is threatened constantly by software patents. +States should not allow patents to restrict development and use of +software on general-purpose computers, but in those that do, we wish to +avoid the special danger that patents applied to a free program could +make it effectively proprietary. To prevent this, the GPL assures that +patents cannot be used to render the program non-free. + + The precise terms and conditions for copying, distribution and +modification follow. + + TERMS AND CONDITIONS + + 0. Definitions. + + "This License" refers to version 3 of the GNU General Public License. + + "Copyright" also means copyright-like laws that apply to other kinds of +works, such as semiconductor masks. + + "The Program" refers to any copyrightable work licensed under this +License. Each licensee is addressed as "you". "Licensees" and +"recipients" may be individuals or organizations. + + To "modify" a work means to copy from or adapt all or part of the work +in a fashion requiring copyright permission, other than the making of an +exact copy. The resulting work is called a "modified version" of the +earlier work or a work "based on" the earlier work. + + A "covered work" means either the unmodified Program or a work based +on the Program. 
+ + To "propagate" a work means to do anything with it that, without +permission, would make you directly or secondarily liable for +infringement under applicable copyright law, except executing it on a +computer or modifying a private copy. Propagation includes copying, +distribution (with or without modification), making available to the +public, and in some countries other activities as well. + + To "convey" a work means any kind of propagation that enables other +parties to make or receive copies. Mere interaction with a user through +a computer network, with no transfer of a copy, is not conveying. + + An interactive user interface displays "Appropriate Legal Notices" +to the extent that it includes a convenient and prominently visible +feature that (1) displays an appropriate copyright notice, and (2) +tells the user that there is no warranty for the work (except to the +extent that warranties are provided), that licensees may convey the +work under this License, and how to view a copy of this License. If +the interface presents a list of user commands or options, such as a +menu, a prominent item in the list meets this criterion. + + 1. Source Code. + + The "source code" for a work means the preferred form of the work +for making modifications to it. "Object code" means any non-source +form of a work. + + A "Standard Interface" means an interface that either is an official +standard defined by a recognized standards body, or, in the case of +interfaces specified for a particular programming language, one that +is widely used among developers working in that language. 
+ + The "System Libraries" of an executable work include anything, other +than the work as a whole, that (a) is included in the normal form of +packaging a Major Component, but which is not part of that Major +Component, and (b) serves only to enable use of the work with that +Major Component, or to implement a Standard Interface for which an +implementation is available to the public in source code form. A +"Major Component", in this context, means a major essential component +(kernel, window system, and so on) of the specific operating system +(if any) on which the executable work runs, or a compiler used to +produce the work, or an object code interpreter used to run it. + + The "Corresponding Source" for a work in object code form means all +the source code needed to generate, install, and (for an executable +work) run the object code and to modify the work, including scripts to +control those activities. However, it does not include the work's +System Libraries, or general-purpose tools or generally available free +programs which are used unmodified in performing those activities but +which are not part of the work. For example, Corresponding Source +includes interface definition files associated with source files for +the work, and the source code for shared libraries and dynamically +linked subprograms that the work is specifically designed to require, +such as by intimate data communication or control flow between those +subprograms and other parts of the work. + + The Corresponding Source need not include anything that users +can regenerate automatically from other parts of the Corresponding +Source. + + The Corresponding Source for a work in source code form is that +same work. + + 2. Basic Permissions. + + All rights granted under this License are granted for the term of +copyright on the Program, and are irrevocable provided the stated +conditions are met. This License explicitly affirms your unlimited +permission to run the unmodified Program. 
The output from running a +covered work is covered by this License only if the output, given its +content, constitutes a covered work. This License acknowledges your +rights of fair use or other equivalent, as provided by copyright law. + + You may make, run and propagate covered works that you do not +convey, without conditions so long as your license otherwise remains +in force. You may convey covered works to others for the sole purpose +of having them make modifications exclusively for you, or provide you +with facilities for running those works, provided that you comply with +the terms of this License in conveying all material for which you do +not control copyright. Those thus making or running the covered works +for you must do so exclusively on your behalf, under your direction +and control, on terms that prohibit them from making any copies of +your copyrighted material outside their relationship with you. + + Conveying under any other circumstances is permitted solely under +the conditions stated below. Sublicensing is not allowed; section 10 +makes it unnecessary. + + 3. Protecting Users' Legal Rights From Anti-Circumvention Law. + + No covered work shall be deemed part of an effective technological +measure under any applicable law fulfilling obligations under article +11 of the WIPO copyright treaty adopted on 20 December 1996, or +similar laws prohibiting or restricting circumvention of such +measures. + + When you convey a covered work, you waive any legal power to forbid +circumvention of technological measures to the extent such circumvention +is effected by exercising rights under this License with respect to +the covered work, and you disclaim any intention to limit operation or +modification of the work as a means of enforcing, against the work's +users, your or third parties' legal rights to forbid circumvention of +technological measures. + + 4. Conveying Verbatim Copies. 
+ + You may convey verbatim copies of the Program's source code as you +receive it, in any medium, provided that you conspicuously and +appropriately publish on each copy an appropriate copyright notice; +keep intact all notices stating that this License and any +non-permissive terms added in accord with section 7 apply to the code; +keep intact all notices of the absence of any warranty; and give all +recipients a copy of this License along with the Program. + + You may charge any price or no price for each copy that you convey, +and you may offer support or warranty protection for a fee. + + 5. Conveying Modified Source Versions. + + You may convey a work based on the Program, or the modifications to +produce it from the Program, in the form of source code under the +terms of section 4, provided that you also meet all of these conditions: + + a) The work must carry prominent notices stating that you modified + it, and giving a relevant date. + + b) The work must carry prominent notices stating that it is + released under this License and any conditions added under section + 7. This requirement modifies the requirement in section 4 to + "keep intact all notices". + + c) You must license the entire work, as a whole, under this + License to anyone who comes into possession of a copy. This + License will therefore apply, along with any applicable section 7 + additional terms, to the whole of the work, and all its parts, + regardless of how they are packaged. This License gives no + permission to license the work in any other way, but it does not + invalidate such permission if you have separately received it. + + d) If the work has interactive user interfaces, each must display + Appropriate Legal Notices; however, if the Program has interactive + interfaces that do not display Appropriate Legal Notices, your + work need not make them do so. 
+ + A compilation of a covered work with other separate and independent +works, which are not by their nature extensions of the covered work, +and which are not combined with it such as to form a larger program, +in or on a volume of a storage or distribution medium, is called an +"aggregate" if the compilation and its resulting copyright are not +used to limit the access or legal rights of the compilation's users +beyond what the individual works permit. Inclusion of a covered work +in an aggregate does not cause this License to apply to the other +parts of the aggregate. + + 6. Conveying Non-Source Forms. + + You may convey a covered work in object code form under the terms +of sections 4 and 5, provided that you also convey the +machine-readable Corresponding Source under the terms of this License, +in one of these ways: + + a) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by the + Corresponding Source fixed on a durable physical medium + customarily used for software interchange. + + b) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by a + written offer, valid for at least three years and valid for as + long as you offer spare parts or customer support for that product + model, to give anyone who possesses the object code either (1) a + copy of the Corresponding Source for all the software in the + product that is covered by this License, on a durable physical + medium customarily used for software interchange, for a price no + more than your reasonable cost of physically performing this + conveying of source, or (2) access to copy the + Corresponding Source from a network server at no charge. + + c) Convey individual copies of the object code with a copy of the + written offer to provide the Corresponding Source. 
This + alternative is allowed only occasionally and noncommercially, and + only if you received the object code with such an offer, in accord + with subsection 6b. + + d) Convey the object code by offering access from a designated + place (gratis or for a charge), and offer equivalent access to the + Corresponding Source in the same way through the same place at no + further charge. You need not require recipients to copy the + Corresponding Source along with the object code. If the place to + copy the object code is a network server, the Corresponding Source + may be on a different server (operated by you or a third party) + that supports equivalent copying facilities, provided you maintain + clear directions next to the object code saying where to find the + Corresponding Source. Regardless of what server hosts the + Corresponding Source, you remain obligated to ensure that it is + available for as long as needed to satisfy these requirements. + + e) Convey the object code using peer-to-peer transmission, provided + you inform other peers where the object code and Corresponding + Source of the work are being offered to the general public at no + charge under subsection 6d. + + A separable portion of the object code, whose source code is excluded +from the Corresponding Source as a System Library, need not be +included in conveying the object code work. + + A "User Product" is either (1) a "consumer product", which means any +tangible personal property which is normally used for personal, family, +or household purposes, or (2) anything designed or sold for incorporation +into a dwelling. In determining whether a product is a consumer product, +doubtful cases shall be resolved in favor of coverage. 
For a particular +product received by a particular user, "normally used" refers to a +typical or common use of that class of product, regardless of the status +of the particular user or of the way in which the particular user +actually uses, or expects or is expected to use, the product. A product +is a consumer product regardless of whether the product has substantial +commercial, industrial or non-consumer uses, unless such uses represent +the only significant mode of use of the product. + + "Installation Information" for a User Product means any methods, +procedures, authorization keys, or other information required to install +and execute modified versions of a covered work in that User Product from +a modified version of its Corresponding Source. The information must +suffice to ensure that the continued functioning of the modified object +code is in no case prevented or interfered with solely because +modification has been made. + + If you convey an object code work under this section in, or with, or +specifically for use in, a User Product, and the conveying occurs as +part of a transaction in which the right of possession and use of the +User Product is transferred to the recipient in perpetuity or for a +fixed term (regardless of how the transaction is characterized), the +Corresponding Source conveyed under this section must be accompanied +by the Installation Information. But this requirement does not apply +if neither you nor any third party retains the ability to install +modified object code on the User Product (for example, the work has +been installed in ROM). + + The requirement to provide Installation Information does not include a +requirement to continue to provide support service, warranty, or updates +for a work that has been modified or installed by the recipient, or for +the User Product in which it has been modified or installed. 
Access to a +network may be denied when the modification itself materially and +adversely affects the operation of the network or violates the rules and +protocols for communication across the network. + + Corresponding Source conveyed, and Installation Information provided, +in accord with this section must be in a format that is publicly +documented (and with an implementation available to the public in +source code form), and must require no special password or key for +unpacking, reading or copying. + + 7. Additional Terms. + + "Additional permissions" are terms that supplement the terms of this +License by making exceptions from one or more of its conditions. +Additional permissions that are applicable to the entire Program shall +be treated as though they were included in this License, to the extent +that they are valid under applicable law. If additional permissions +apply only to part of the Program, that part may be used separately +under those permissions, but the entire Program remains governed by +this License without regard to the additional permissions. + + When you convey a copy of a covered work, you may at your option +remove any additional permissions from that copy, or from any part of +it. (Additional permissions may be written to require their own +removal in certain cases when you modify the work.) You may place +additional permissions on material, added by you to a covered work, +for which you have or can give appropriate copyright permission. 
+ + Notwithstanding any other provision of this License, for material you +add to a covered work, you may (if authorized by the copyright holders of +that material) supplement the terms of this License with terms: + + a) Disclaiming warranty or limiting liability differently from the + terms of sections 15 and 16 of this License; or + + b) Requiring preservation of specified reasonable legal notices or + author attributions in that material or in the Appropriate Legal + Notices displayed by works containing it; or + + c) Prohibiting misrepresentation of the origin of that material, or + requiring that modified versions of such material be marked in + reasonable ways as different from the original version; or + + d) Limiting the use for publicity purposes of names of licensors or + authors of the material; or + + e) Declining to grant rights under trademark law for use of some + trade names, trademarks, or service marks; or + + f) Requiring indemnification of licensors and authors of that + material by anyone who conveys the material (or modified versions of + it) with contractual assumptions of liability to the recipient, for + any liability that these contractual assumptions directly impose on + those licensors and authors. + + All other non-permissive additional terms are considered "further +restrictions" within the meaning of section 10. If the Program as you +received it, or any part of it, contains a notice stating that it is +governed by this License along with a term that is a further +restriction, you may remove that term. If a license document contains +a further restriction but permits relicensing or conveying under this +License, you may add to a covered work material governed by the terms +of that license document, provided that the further restriction does +not survive such relicensing or conveying. 
+ + If you add terms to a covered work in accord with this section, you +must place, in the relevant source files, a statement of the +additional terms that apply to those files, or a notice indicating +where to find the applicable terms. + + Additional terms, permissive or non-permissive, may be stated in the +form of a separately written license, or stated as exceptions; +the above requirements apply either way. + + 8. Termination. + + You may not propagate or modify a covered work except as expressly +provided under this License. Any attempt otherwise to propagate or +modify it is void, and will automatically terminate your rights under +this License (including any patent licenses granted under the third +paragraph of section 11). + + However, if you cease all violation of this License, then your +license from a particular copyright holder is reinstated (a) +provisionally, unless and until the copyright holder explicitly and +finally terminates your license, and (b) permanently, if the copyright +holder fails to notify you of the violation by some reasonable means +prior to 60 days after the cessation. + + Moreover, your license from a particular copyright holder is +reinstated permanently if the copyright holder notifies you of the +violation by some reasonable means, this is the first time you have +received notice of violation of this License (for any work) from that +copyright holder, and you cure the violation prior to 30 days after +your receipt of the notice. + + Termination of your rights under this section does not terminate the +licenses of parties who have received copies or rights from you under +this License. If your rights have been terminated and not permanently +reinstated, you do not qualify to receive new licenses for the same +material under section 10. + + 9. Acceptance Not Required for Having Copies. + + You are not required to accept this License in order to receive or +run a copy of the Program. 
Ancillary propagation of a covered work +occurring solely as a consequence of using peer-to-peer transmission +to receive a copy likewise does not require acceptance. However, +nothing other than this License grants you permission to propagate or +modify any covered work. These actions infringe copyright if you do +not accept this License. Therefore, by modifying or propagating a +covered work, you indicate your acceptance of this License to do so. + + 10. Automatic Licensing of Downstream Recipients. + + Each time you convey a covered work, the recipient automatically +receives a license from the original licensors, to run, modify and +propagate that work, subject to this License. You are not responsible +for enforcing compliance by third parties with this License. + + An "entity transaction" is a transaction transferring control of an +organization, or substantially all assets of one, or subdividing an +organization, or merging organizations. If propagation of a covered +work results from an entity transaction, each party to that +transaction who receives a copy of the work also receives whatever +licenses to the work the party's predecessor in interest had or could +give under the previous paragraph, plus a right to possession of the +Corresponding Source of the work from the predecessor in interest, if +the predecessor has it or can get it with reasonable efforts. + + You may not impose any further restrictions on the exercise of the +rights granted or affirmed under this License. For example, you may +not impose a license fee, royalty, or other charge for exercise of +rights granted under this License, and you may not initiate litigation +(including a cross-claim or counterclaim in a lawsuit) alleging that +any patent claim is infringed by making, using, selling, offering for +sale, or importing the Program or any portion of it. + + 11. Patents. 
+ + A "contributor" is a copyright holder who authorizes use under this +License of the Program or a work on which the Program is based. The +work thus licensed is called the contributor's "contributor version". + + A contributor's "essential patent claims" are all patent claims +owned or controlled by the contributor, whether already acquired or +hereafter acquired, that would be infringed by some manner, permitted +by this License, of making, using, or selling its contributor version, +but do not include claims that would be infringed only as a +consequence of further modification of the contributor version. For +purposes of this definition, "control" includes the right to grant +patent sublicenses in a manner consistent with the requirements of +this License. + + Each contributor grants you a non-exclusive, worldwide, royalty-free +patent license under the contributor's essential patent claims, to +make, use, sell, offer for sale, import and otherwise run, modify and +propagate the contents of its contributor version. + + In the following three paragraphs, a "patent license" is any express +agreement or commitment, however denominated, not to enforce a patent +(such as an express permission to practice a patent or covenant not to +sue for patent infringement). To "grant" such a patent license to a +party means to make such an agreement or commitment not to enforce a +patent against the party. 
+ + If you convey a covered work, knowingly relying on a patent license, +and the Corresponding Source of the work is not available for anyone +to copy, free of charge and under the terms of this License, through a +publicly available network server or other readily accessible means, +then you must either (1) cause the Corresponding Source to be so +available, or (2) arrange to deprive yourself of the benefit of the +patent license for this particular work, or (3) arrange, in a manner +consistent with the requirements of this License, to extend the patent +license to downstream recipients. "Knowingly relying" means you have +actual knowledge that, but for the patent license, your conveying the +covered work in a country, or your recipient's use of the covered work +in a country, would infringe one or more identifiable patents in that +country that you have reason to believe are valid. + + If, pursuant to or in connection with a single transaction or +arrangement, you convey, or propagate by procuring conveyance of, a +covered work, and grant a patent license to some of the parties +receiving the covered work authorizing them to use, propagate, modify +or convey a specific copy of the covered work, then the patent license +you grant is automatically extended to all recipients of the covered +work and works based on it. + + A patent license is "discriminatory" if it does not include within +the scope of its coverage, prohibits the exercise of, or is +conditioned on the non-exercise of one or more of the rights that are +specifically granted under this License. 
You may not convey a covered +work if you are a party to an arrangement with a third party that is +in the business of distributing software, under which you make payment +to the third party based on the extent of your activity of conveying +the work, and under which the third party grants, to any of the +parties who would receive the covered work from you, a discriminatory +patent license (a) in connection with copies of the covered work +conveyed by you (or copies made from those copies), or (b) primarily +for and in connection with specific products or compilations that +contain the covered work, unless you entered into that arrangement, +or that patent license was granted, prior to 28 March 2007. + + Nothing in this License shall be construed as excluding or limiting +any implied license or other defenses to infringement that may +otherwise be available to you under applicable patent law. + + 12. No Surrender of Others' Freedom. + + If conditions are imposed on you (whether by court order, agreement or +otherwise) that contradict the conditions of this License, they do not +excuse you from the conditions of this License. If you cannot convey a +covered work so as to satisfy simultaneously your obligations under this +License and any other pertinent obligations, then as a consequence you may +not convey it at all. For example, if you agree to terms that obligate you +to collect a royalty for further conveying from those to whom you convey +the Program, the only way you could satisfy both those terms and this +License would be to refrain entirely from conveying the Program. + + 13. Use with the GNU Affero General Public License. + + Notwithstanding any other provision of this License, you have +permission to link or combine any covered work with a work licensed +under version 3 of the GNU Affero General Public License into a single +combined work, and to convey the resulting work. 
The terms of this +License will continue to apply to the part which is the covered work, +but the special requirements of the GNU Affero General Public License, +section 13, concerning interaction through a network will apply to the +combination as such. + + 14. Revised Versions of this License. + + The Free Software Foundation may publish revised and/or new versions of +the GNU General Public License from time to time. Such new versions will +be similar in spirit to the present version, but may differ in detail to +address new problems or concerns. + + Each version is given a distinguishing version number. If the +Program specifies that a certain numbered version of the GNU General +Public License "or any later version" applies to it, you have the +option of following the terms and conditions either of that numbered +version or of any later version published by the Free Software +Foundation. If the Program does not specify a version number of the +GNU General Public License, you may choose any version ever published +by the Free Software Foundation. + + If the Program specifies that a proxy can decide which future +versions of the GNU General Public License can be used, that proxy's +public statement of acceptance of a version permanently authorizes you +to choose that version for the Program. + + Later license versions may give you additional or different +permissions. However, no additional obligations are imposed on any +author or copyright holder as a result of your choosing to follow a +later version. + + 15. Disclaimer of Warranty. + + THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY +APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT +HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY +OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, +THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +PURPOSE. 
THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM +IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF +ALL NECESSARY SERVICING, REPAIR OR CORRECTION. + + 16. Limitation of Liability. + + IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING +WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS +THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY +GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE +USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF +DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD +PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), +EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF +SUCH DAMAGES. + + 17. Interpretation of Sections 15 and 16. + + If the disclaimer of warranty and limitation of liability provided +above cannot be given local legal effect according to their terms, +reviewing courts shall apply local law that most closely approximates +an absolute waiver of all civil liability in connection with the +Program, unless a warranty or assumption of liability accompanies a +copy of the Program in return for a fee. + + END OF TERMS AND CONDITIONS + + How to Apply These Terms to Your New Programs + + If you develop a new program, and you want it to be of the greatest +possible use to the public, the best way to achieve this is to make it +free software which everyone can redistribute and change under these terms. + + To do so, attach the following notices to the program. It is safest +to attach them to the start of each source file to most effectively +state the exclusion of warranty; and each file should have at least +the "copyright" line and a pointer to where the full notice is found. 
+ + <one line to give the program's name and a brief idea of what it does.> + Copyright (C) <year> <name of author> + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation, either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program. If not, see <https://www.gnu.org/licenses/>. + +Also add information on how to contact you by electronic and paper mail. + + If the program does terminal interaction, make it output a short +notice like this when it starts in an interactive mode: + + <program> Copyright (C) <year> <name of author> + This program comes with ABSOLUTELY NO WARRANTY; for details type `show w'. + This is free software, and you are welcome to redistribute it + under certain conditions; type `show c' for details. + +The hypothetical commands `show w' and `show c' should show the appropriate +parts of the General Public License. Of course, your program's commands +might be different; for a GUI interface, you would use an "about box". + + You should also get your employer (if you work as a programmer) or school, +if any, to sign a "copyright disclaimer" for the program, if necessary. +For more information on this, and how to apply and follow the GNU GPL, see +<https://www.gnu.org/licenses/>. + + The GNU General Public License does not permit incorporating your program +into proprietary programs. If your program is a subroutine library, you +may consider it more useful to permit linking proprietary applications with +the library. 
If this is what you want to do, use the GNU Lesser General +Public License instead of this License. But first, please read +<https://www.gnu.org/licenses/why-not-lgpl.html>. diff --git a/app.py b/app.py new file mode 100644 index 0000000000000000000000000000000000000000..2e9e90ed98db6ff749c2409acc5093cd57353f03 --- /dev/null +++ b/app.py @@ -0,0 +1,55 @@ +from flask import Flask, render_template, request, redirect, url_for +import subprocess +import os +from werkzeug.utils import secure_filename + +app = Flask(__name__) + +# Configuration for file uploads +UPLOAD_FOLDER = 'uploads' +app.config['UPLOAD_FOLDER'] = UPLOAD_FOLDER +OUTPUT_FOLDER = 'output_files' +app.config['OUTPUT_FOLDER'] = OUTPUT_FOLDER + +@app.route('/', methods=['GET', 'POST']) +def index(): + if request.method == 'POST': + # Handle file uploads + source_file = request.files['source'] + target_file = request.files['target'] + frame_processor = request.form.getlist('frame_processor') + + # Save uploaded files + source_path = os.path.join(app.config['UPLOAD_FOLDER'], secure_filename(source_file.filename)) + target_path = os.path.join(app.config['UPLOAD_FOLDER'], secure_filename(target_file.filename)) + source_file.save(source_path) + target_file.save(target_path) + + # Determine output file name + output_filename = secure_filename('output.jpg') # Default output format is JPEG + + # Build the command based on the provided options + command = ['python', 'run.py', '-s', source_path, '-t', target_path] + command.extend(['-o', os.path.join(app.config['OUTPUT_FOLDER'], output_filename)]) + command.extend(['--frame-processor', *frame_processor]) + + # Execute the command + try: + subprocess.run(command, check=True) + return redirect(url_for('output', filename=output_filename)) + except subprocess.CalledProcessError: + return render_template('error.html') + + return render_template('index.html') + +@app.route('/output/<filename>') +def output(filename): + return render_template('output.html', 
filename=filename) +@app.route('/output_image/<filename>') +def output_image(filename): + return app.send_static_file(os.path.join(app.config['OUTPUT_FOLDER'], filename)) + +if __name__ == '__main__': + os.makedirs(app.config['UPLOAD_FOLDER'], exist_ok=True) + os.makedirs(app.config['OUTPUT_FOLDER'], exist_ok=True) + app.run(debug=True) diff --git a/gfpgan/weights/detection_Resnet50_Final.pth b/gfpgan/weights/detection_Resnet50_Final.pth new file mode 100644 index 0000000000000000000000000000000000000000..16546738ce0a00a9fd47585e0fc52744d31cc117 --- /dev/null +++ b/gfpgan/weights/detection_Resnet50_Final.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d1de9c2944f2ccddca5f5e010ea5ae64a39845a86311af6fdf30841b0a5a16d +size 109497761 diff --git a/gfpgan/weights/parsing_parsenet.pth b/gfpgan/weights/parsing_parsenet.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ac2efc50360a79c9905dbac57d9d99cbfbe863c --- /dev/null +++ b/gfpgan/weights/parsing_parsenet.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d558d8d0e42c20224f13cf5a29c79eba2d59913419f945545d8cf7b72920de2 +size 85331193 diff --git a/models/GFPGANv1.4.pth b/models/GFPGANv1.4.pth new file mode 100644 index 0000000000000000000000000000000000000000..afedb5c7e826056840c9cc183f2c6f0186fd17ba --- /dev/null +++ b/models/GFPGANv1.4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2cd4703ab14f4d01fd1383a8a8b266f9a5833dacee8e6a79d3bf21a1b6be5ad +size 348632874 diff --git a/models/inswapper_128.onnx b/models/inswapper_128.onnx new file mode 100644 index 0000000000000000000000000000000000000000..cb672b799d74fdf7ab8b172a1b1d78411f6400f5 --- /dev/null +++ b/models/inswapper_128.onnx @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a3f08c753cb72d04e10aa0f7dbe3deebbf39567d4ead6dce08e98aa49e16af +size 554253681 diff --git a/mypy.ini b/mypy.ini new file mode 100644 index 
0000000000000000000000000000000000000000..64218bc23688632a08c98ec4a0451ed46f8ed5e5 --- /dev/null +++ b/mypy.ini @@ -0,0 +1,7 @@ +[mypy] +check_untyped_defs = True +disallow_any_generics = True +disallow_untyped_calls = True +disallow_untyped_defs = True +ignore_missing_imports = True +strict_optional = False diff --git a/output_files/output.jpg b/output_files/output.jpg new file mode 100644 index 0000000000000000000000000000000000000000..9bd06f34c2b8cae2a985742fd7680561a9863cba Binary files /dev/null and b/output_files/output.jpg differ diff --git a/requirements-headless.txt b/requirements-headless.txt new file mode 100644 index 0000000000000000000000000000000000000000..ce287f52da12b0bcc6cba3c2e244c322742dde16 --- /dev/null +++ b/requirements-headless.txt @@ -0,0 +1,13 @@ +numpy==1.24.3 +opencv-python==4.8.0.74 +onnx==1.14.0 +insightface==0.7.3 +psutil==5.9.5 +tk==0.1.0 +customtkinter==5.2.0 +tkinterdnd2==0.3.0 +onnxruntime==1.15.0 +tensorflow==2.13.0 +opennsfw2==0.10.2 +protobuf==4.23.4 +tqdm==4.65.0 diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..9f289fda318373ab1dc26ade4ff1704bf6ae13e6 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,21 @@ +--extra-index-url https://download.pytorch.org/whl/cu118 + +numpy==1.24.3 +opencv-python==4.8.0.74 +onnx==1.14.0 +insightface==0.7.3 +psutil==5.9.5 +tk==0.1.0 +customtkinter==5.2.0 +tkinterdnd2==0.3.0; sys_platform != 'darwin' and platform_machine != 'arm64' +tkinterdnd2-universal==1.7.3; sys_platform == 'darwin' and platform_machine == 'arm64' +pillow==10.0.0 +onnxruntime==1.15.1; python_version != '3.9' and sys_platform == 'darwin' and platform_machine != 'arm64' +onnxruntime-coreml==1.13.1; python_version == '3.9' and sys_platform == 'darwin' and platform_machine != 'arm64' +onnxruntime-silicon==1.13.1; sys_platform == 'darwin' and platform_machine == 'arm64' +onnxruntime-gpu==1.15.1; sys_platform != 'darwin' +tensorflow==2.13.0 +opennsfw2==0.10.2 
+protobuf==4.23.4 +tqdm==4.65.0 +gfpgan==1.3.8 diff --git a/roop/__init__.py b/roop/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/roop/__pycache__/__init__.cpython-310.pyc b/roop/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a0b7fad842298db1ce5d5b5a1005d254411ba81c Binary files /dev/null and b/roop/__pycache__/__init__.cpython-310.pyc differ diff --git a/roop/__pycache__/capturer.cpython-310.pyc b/roop/__pycache__/capturer.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..314d9da20991c043f7ccc98848792bc0f6edfcb1 Binary files /dev/null and b/roop/__pycache__/capturer.cpython-310.pyc differ diff --git a/roop/__pycache__/core.cpython-310.pyc b/roop/__pycache__/core.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..bc535923919e9effd430f2cfe9f79f6eb2fc541b Binary files /dev/null and b/roop/__pycache__/core.cpython-310.pyc differ diff --git a/roop/__pycache__/face_analyser.cpython-310.pyc b/roop/__pycache__/face_analyser.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..7be5cb2cb25fec66490337267088b259ede362d4 Binary files /dev/null and b/roop/__pycache__/face_analyser.cpython-310.pyc differ diff --git a/roop/__pycache__/face_reference.cpython-310.pyc b/roop/__pycache__/face_reference.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..a5f016bfe111c6f615d670fba8df51f35061781f Binary files /dev/null and b/roop/__pycache__/face_reference.cpython-310.pyc differ diff --git a/roop/__pycache__/globals.cpython-310.pyc b/roop/__pycache__/globals.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..49fac06bc69699f44abffebe4d9b51ce1a270fc7 Binary files /dev/null and b/roop/__pycache__/globals.cpython-310.pyc differ diff --git 
a/roop/__pycache__/metadata.cpython-310.pyc b/roop/__pycache__/metadata.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..55ba80562849d310fd6be2b66c1f098f9ccc10c8 Binary files /dev/null and b/roop/__pycache__/metadata.cpython-310.pyc differ diff --git a/roop/__pycache__/predictor.cpython-310.pyc b/roop/__pycache__/predictor.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..cda1076af3882e18abac2d01639289396d753094 Binary files /dev/null and b/roop/__pycache__/predictor.cpython-310.pyc differ diff --git a/roop/__pycache__/typing.cpython-310.pyc b/roop/__pycache__/typing.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..3ef3c36b9d99d430908edca3b88ad8a71b2c4dfb Binary files /dev/null and b/roop/__pycache__/typing.cpython-310.pyc differ diff --git a/roop/__pycache__/ui.cpython-310.pyc b/roop/__pycache__/ui.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..5dacc4fc186122d50a8f9edaccfaa7ebdcda0a25 Binary files /dev/null and b/roop/__pycache__/ui.cpython-310.pyc differ diff --git a/roop/__pycache__/utilities.cpython-310.pyc b/roop/__pycache__/utilities.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..10958b008d149cd5125ac72794bcbb0074ed1902 Binary files /dev/null and b/roop/__pycache__/utilities.cpython-310.pyc differ diff --git a/roop/capturer.py b/roop/capturer.py new file mode 100644 index 0000000000000000000000000000000000000000..515fc8e54a9a3709ceee4c340f33e0b907416073 --- /dev/null +++ b/roop/capturer.py @@ -0,0 +1,22 @@ +from typing import Optional +import cv2 + +from roop.typing import Frame + + +def get_video_frame(video_path: str, frame_number: int = 0) -> Optional[Frame]: + capture = cv2.VideoCapture(video_path) + frame_total = capture.get(cv2.CAP_PROP_FRAME_COUNT) + capture.set(cv2.CAP_PROP_POS_FRAMES, min(frame_total, frame_number - 1)) + has_frame, frame = capture.read() + 
capture.release() + if has_frame: + return frame + return None + + +def get_video_frame_total(video_path: str) -> int: + capture = cv2.VideoCapture(video_path) + video_frame_total = int(capture.get(cv2.CAP_PROP_FRAME_COUNT)) + capture.release() + return video_frame_total diff --git a/roop/core.py b/roop/core.py new file mode 100644 index 0000000000000000000000000000000000000000..7e5a46fbd25334bce072c65f3132b56c6b39358e --- /dev/null +++ b/roop/core.py @@ -0,0 +1,220 @@ +#!/usr/bin/env python3 + +import os +import sys +# single thread doubles cuda performance - needs to be set before torch import +if any(arg.startswith('--execution-provider') for arg in sys.argv): + os.environ['OMP_NUM_THREADS'] = '1' +# reduce tensorflow log level +os.environ['TF_CPP_MIN_LOG_LEVEL'] = '2' +import warnings +from typing import List +import platform +import signal +import shutil +import argparse +import onnxruntime +import tensorflow +import roop.globals +import roop.metadata +import roop.ui as ui +from roop.predictor import predict_image, predict_video +from roop.processors.frame.core import get_frame_processors_modules +from roop.utilities import has_image_extension, is_image, is_video, detect_fps, create_video, extract_frames, get_temp_frame_paths, restore_audio, create_temp, move_temp, clean_temp, normalize_output_path + +warnings.filterwarnings('ignore', category=FutureWarning, module='insightface') +warnings.filterwarnings('ignore', category=UserWarning, module='torchvision') + + +def parse_args() -> None: + signal.signal(signal.SIGINT, lambda signal_number, frame: destroy()) + program = argparse.ArgumentParser(formatter_class=lambda prog: argparse.HelpFormatter(prog, max_help_position=100)) + program.add_argument('-s', '--source', help='select an source image', dest='source_path') + program.add_argument('-t', '--target', help='select an target image or video', dest='target_path') + program.add_argument('-o', '--output', help='select output file or directory', 
dest='output_path') + program.add_argument('--frame-processor', help='frame processors (choices: face_swapper, face_enhancer, ...)', dest='frame_processor', default=['face_swapper'], nargs='+') + program.add_argument('--keep-fps', help='keep target fps', dest='keep_fps', action='store_true') + program.add_argument('--keep-frames', help='keep temporary frames', dest='keep_frames', action='store_true') + program.add_argument('--skip-audio', help='skip target audio', dest='skip_audio', action='store_true') + program.add_argument('--many-faces', help='process every face', dest='many_faces', action='store_true') + program.add_argument('--reference-face-position', help='position of the reference face', dest='reference_face_position', type=int, default=0) + program.add_argument('--reference-frame-number', help='number of the reference frame', dest='reference_frame_number', type=int, default=0) + program.add_argument('--similar-face-distance', help='face distance used for recognition', dest='similar_face_distance', type=float, default=0.85) + program.add_argument('--temp-frame-format', help='image format used for frame extraction', dest='temp_frame_format', default='png', choices=['jpg', 'png']) + program.add_argument('--temp-frame-quality', help='image quality used for frame extraction', dest='temp_frame_quality', type=int, default=0, choices=range(101), metavar='[0-100]') + program.add_argument('--output-video-encoder', help='encoder used for the output video', dest='output_video_encoder', default='libx264', choices=['libx264', 'libx265', 'libvpx-vp9', 'h264_nvenc', 'hevc_nvenc']) + program.add_argument('--output-video-quality', help='quality used for the output video', dest='output_video_quality', type=int, default=35, choices=range(101), metavar='[0-100]') + program.add_argument('--max-memory', help='maximum amount of RAM in GB', dest='max_memory', type=int) + program.add_argument('--execution-provider', help='available execution provider (choices: cpu, ...)', 
dest='execution_provider', default=['cpu'], choices=suggest_execution_providers(), nargs='+') + program.add_argument('--execution-threads', help='number of execution threads', dest='execution_threads', type=int, default=suggest_execution_threads()) + program.add_argument('-v', '--version', action='version', version=f'{roop.metadata.name} {roop.metadata.version}') + + args = program.parse_args() + + roop.globals.source_path = args.source_path + roop.globals.target_path = args.target_path + roop.globals.output_path = normalize_output_path(roop.globals.source_path, roop.globals.target_path, args.output_path) + roop.globals.headless = roop.globals.source_path is not None and roop.globals.target_path is not None and roop.globals.output_path is not None + roop.globals.frame_processors = args.frame_processor + roop.globals.keep_fps = args.keep_fps + roop.globals.keep_frames = args.keep_frames + roop.globals.skip_audio = args.skip_audio + roop.globals.many_faces = args.many_faces + roop.globals.reference_face_position = args.reference_face_position + roop.globals.reference_frame_number = args.reference_frame_number + roop.globals.similar_face_distance = args.similar_face_distance + roop.globals.temp_frame_format = args.temp_frame_format + roop.globals.temp_frame_quality = args.temp_frame_quality + roop.globals.output_video_encoder = args.output_video_encoder + roop.globals.output_video_quality = args.output_video_quality + roop.globals.max_memory = args.max_memory + roop.globals.execution_providers = decode_execution_providers(args.execution_provider) + roop.globals.execution_threads = args.execution_threads + + +def encode_execution_providers(execution_providers: List[str]) -> List[str]: + return [execution_provider.replace('ExecutionProvider', '').lower() for execution_provider in execution_providers] + + +def decode_execution_providers(execution_providers: List[str]) -> List[str]: + return [provider for provider, encoded_execution_provider in 
zip(onnxruntime.get_available_providers(), encode_execution_providers(onnxruntime.get_available_providers())) + if any(execution_provider in encoded_execution_provider for execution_provider in execution_providers)] + + +def suggest_execution_providers() -> List[str]: + return encode_execution_providers(onnxruntime.get_available_providers()) + + +def suggest_execution_threads() -> int: + if 'CUDAExecutionProvider' in onnxruntime.get_available_providers(): + return 8 + return 1 + + +def limit_resources() -> None: + # prevent tensorflow memory leak + gpus = tensorflow.config.experimental.list_physical_devices('GPU') + for gpu in gpus: + tensorflow.config.experimental.set_virtual_device_configuration(gpu, [ + tensorflow.config.experimental.VirtualDeviceConfiguration(memory_limit=1024) + ]) + # limit memory usage + if roop.globals.max_memory: + memory = roop.globals.max_memory * 1024 ** 3 + if platform.system().lower() == 'darwin': + memory = roop.globals.max_memory * 1024 ** 6 + if platform.system().lower() == 'windows': + import ctypes + kernel32 = ctypes.windll.kernel32 # type: ignore[attr-defined] + kernel32.SetProcessWorkingSetSize(-1, ctypes.c_size_t(memory), ctypes.c_size_t(memory)) + else: + import resource + resource.setrlimit(resource.RLIMIT_DATA, (memory, memory)) + + +def pre_check() -> bool: + if sys.version_info < (3, 9): + update_status('Python version is not supported - please upgrade to 3.9 or higher.') + return False + if not shutil.which('ffmpeg'): + update_status('ffmpeg is not installed.') + return False + return True + + +def update_status(message: str, scope: str = 'ROOP.CORE') -> None: + print(f'[{scope}] {message}') + if not roop.globals.headless: + ui.update_status(message) + + +def start() -> None: + for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): + if not frame_processor.pre_start(): + return + # process image to image + if has_image_extension(roop.globals.target_path): + if 
predict_image(roop.globals.target_path): + destroy() + shutil.copy2(roop.globals.target_path, roop.globals.output_path) + # process frame + for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): + update_status('Progressing...', frame_processor.NAME) + frame_processor.process_image(roop.globals.source_path, roop.globals.output_path, roop.globals.output_path) + frame_processor.post_process() + # validate image + if is_image(roop.globals.target_path): + update_status('Processing to image succeed!') + else: + update_status('Processing to image failed!') + return + # process image to videos + if predict_video(roop.globals.target_path): + destroy() + update_status('Creating temporary resources...') + create_temp(roop.globals.target_path) + # extract frames + if roop.globals.keep_fps: + fps = detect_fps(roop.globals.target_path) + update_status(f'Extracting frames with {fps} FPS...') + extract_frames(roop.globals.target_path, fps) + else: + update_status('Extracting frames with 30 FPS...') + extract_frames(roop.globals.target_path) + # process frame + temp_frame_paths = get_temp_frame_paths(roop.globals.target_path) + if temp_frame_paths: + for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): + update_status('Progressing...', frame_processor.NAME) + frame_processor.process_video(roop.globals.source_path, temp_frame_paths) + frame_processor.post_process() + else: + update_status('Frames not found...') + return + # create video + if roop.globals.keep_fps: + fps = detect_fps(roop.globals.target_path) + update_status(f'Creating video with {fps} FPS...') + create_video(roop.globals.target_path, fps) + else: + update_status('Creating video with 30 FPS...') + create_video(roop.globals.target_path) + # handle audio + if roop.globals.skip_audio: + move_temp(roop.globals.target_path, roop.globals.output_path) + update_status('Skipping audio...') + else: + if roop.globals.keep_fps: + update_status('Restoring audio...') + 
else: + update_status('Restoring audio might cause issues as fps are not kept...') + restore_audio(roop.globals.target_path, roop.globals.output_path) + # clean temp + update_status('Cleaning temporary resources...') + clean_temp(roop.globals.target_path) + # validate video + if is_video(roop.globals.target_path): + update_status('Processing to video succeed!') + else: + update_status('Processing to video failed!') + + +def destroy() -> None: + if roop.globals.target_path: + clean_temp(roop.globals.target_path) + sys.exit() + + +def run() -> None: + parse_args() + if not pre_check(): + return + for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): + if not frame_processor.pre_check(): + return + limit_resources() + if roop.globals.headless: + start() + else: + window = ui.init(start, destroy) + window.mainloop() diff --git a/roop/face_analyser.py b/roop/face_analyser.py new file mode 100644 index 0000000000000000000000000000000000000000..81cd39100122c64023ad01ac0e8b457a812a0216 --- /dev/null +++ b/roop/face_analyser.py @@ -0,0 +1,54 @@ +import threading +from typing import Any, Optional, List +import insightface +import numpy + +import roop.globals +from roop.typing import Frame, Face + +FACE_ANALYSER = None +THREAD_LOCK = threading.Lock() + + +def get_face_analyser() -> Any: + global FACE_ANALYSER + + with THREAD_LOCK: + if FACE_ANALYSER is None: + FACE_ANALYSER = insightface.app.FaceAnalysis(name='buffalo_l', providers=roop.globals.execution_providers) + FACE_ANALYSER.prepare(ctx_id=0) + return FACE_ANALYSER + + +def clear_face_analyser() -> Any: + global FACE_ANALYSER + + FACE_ANALYSER = None + + +def get_one_face(frame: Frame, position: int = 0) -> Optional[Face]: + many_faces = get_many_faces(frame) + if many_faces: + try: + return many_faces[position] + except IndexError: + return many_faces[-1] + return None + + +def get_many_faces(frame: Frame) -> Optional[List[Face]]: + try: + return get_face_analyser().get(frame) + except 
ValueError: + return None + + +def find_similar_face(frame: Frame, reference_face: Face) -> Optional[Face]: + many_faces = get_many_faces(frame) + if many_faces: + for face in many_faces: + if hasattr(face, 'normed_embedding') and hasattr(reference_face, 'normed_embedding'): + distance = numpy.sum(numpy.square(face.normed_embedding - reference_face.normed_embedding)) + if distance < roop.globals.similar_face_distance: + return face + return None diff --git a/roop/face_reference.py b/roop/face_reference.py new file mode 100644 index 0000000000000000000000000000000000000000..3c3e1f1c6e13c73ceafd40c0912c066a3a86a528 --- /dev/null +++ b/roop/face_reference.py @@ -0,0 +1,21 @@ +from typing import Optional + +from roop.typing import Face + +FACE_REFERENCE = None + + +def get_face_reference() -> Optional[Face]: + return FACE_REFERENCE + + +def set_face_reference(face: Face) -> None: + global FACE_REFERENCE + + FACE_REFERENCE = face + + +def clear_face_reference() -> None: + global FACE_REFERENCE + + FACE_REFERENCE = None diff --git a/roop/globals.py b/roop/globals.py new file mode 100644 index 0000000000000000000000000000000000000000..3eca8d0d024db967cc6d7e7149f68f65f84d7072 --- /dev/null +++ b/roop/globals.py @@ -0,0 +1,22 @@ +from typing import List, Optional + +source_path: Optional[str] = None +target_path: Optional[str] = None +output_path: Optional[str] = None +headless: Optional[bool] = None +frame_processors: List[str] = [] +keep_fps: Optional[bool] = None +keep_frames: Optional[bool] = None +skip_audio: Optional[bool] = None +many_faces: Optional[bool] = None +reference_face_position: Optional[int] = None +reference_frame_number: Optional[int] = None +similar_face_distance: Optional[float] = None +temp_frame_format: Optional[str] = None +temp_frame_quality: Optional[int] = None +output_video_encoder: Optional[str] = None +output_video_quality: Optional[int] = None +max_memory: Optional[int] = None +execution_providers: List[str] = [] +execution_threads: 
Optional[int] = None +log_level: str = 'error' diff --git a/roop/metadata.py b/roop/metadata.py new file mode 100644 index 0000000000000000000000000000000000000000..aea9e16d897ede57f566ccc773d0d2ee17905dfb --- /dev/null +++ b/roop/metadata.py @@ -0,0 +1,2 @@ +name = 'roop' +version = '1.3.2' diff --git a/roop/predictor.py b/roop/predictor.py new file mode 100644 index 0000000000000000000000000000000000000000..b59fee93e02daeec6660139b61c2cd76d5fd2b94 --- /dev/null +++ b/roop/predictor.py @@ -0,0 +1,43 @@ +import threading +import numpy +import opennsfw2 +from PIL import Image +from keras import Model + +from roop.typing import Frame + +PREDICTOR = None +THREAD_LOCK = threading.Lock() +MAX_PROBABILITY = 0.85 + + +def get_predictor() -> Model: + global PREDICTOR + + with THREAD_LOCK: + if PREDICTOR is None: + PREDICTOR = opennsfw2.make_open_nsfw_model() + return PREDICTOR + + +def clear_predictor() -> None: + global PREDICTOR + + PREDICTOR = None + + +def predict_frame(target_frame: Frame) -> bool: + image = Image.fromarray(target_frame) + image = opennsfw2.preprocess_image(image, opennsfw2.Preprocessing.YAHOO) + views = numpy.expand_dims(image, axis=0) + _, probability = get_predictor().predict(views)[0] + return probability > MAX_PROBABILITY + + +def predict_image(target_path: str) -> bool: + return opennsfw2.predict_image(target_path) > MAX_PROBABILITY + + +def predict_video(target_path: str) -> bool: + _, probabilities = opennsfw2.predict_video_frames(video_path=target_path, frame_interval=100) + return any(probability > MAX_PROBABILITY for probability in probabilities) diff --git a/roop/processors/__init__.py b/roop/processors/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/roop/processors/__pycache__/__init__.cpython-310.pyc b/roop/processors/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 
0000000000000000000000000000000000000000..3756ea9728ef20e444641d0e62affa7bf051f081 Binary files /dev/null and b/roop/processors/__pycache__/__init__.cpython-310.pyc differ diff --git a/roop/processors/frame/__init__.py b/roop/processors/frame/__init__.py new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/roop/processors/frame/__pycache__/__init__.cpython-310.pyc b/roop/processors/frame/__pycache__/__init__.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..54a301f2d5c7fbf31a94f06eee7cd9924ffcf74f Binary files /dev/null and b/roop/processors/frame/__pycache__/__init__.cpython-310.pyc differ diff --git a/roop/processors/frame/__pycache__/core.cpython-310.pyc b/roop/processors/frame/__pycache__/core.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..2c999f1f47c0be4b0a35c147c875019dd90c9664 Binary files /dev/null and b/roop/processors/frame/__pycache__/core.cpython-310.pyc differ diff --git a/roop/processors/frame/__pycache__/face_enhancer.cpython-310.pyc b/roop/processors/frame/__pycache__/face_enhancer.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..819c489f8e58916d9e0cbcbffd006a62c4c9699a Binary files /dev/null and b/roop/processors/frame/__pycache__/face_enhancer.cpython-310.pyc differ diff --git a/roop/processors/frame/__pycache__/face_swapper.cpython-310.pyc b/roop/processors/frame/__pycache__/face_swapper.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..71df834ce0c075ea3da64d859fa1c65f51898dfa Binary files /dev/null and b/roop/processors/frame/__pycache__/face_swapper.cpython-310.pyc differ diff --git a/roop/processors/frame/core.py b/roop/processors/frame/core.py new file mode 100644 index 0000000000000000000000000000000000000000..498169d34a00e0a2547940380afd69967a2eca8c --- /dev/null +++ b/roop/processors/frame/core.py @@ -0,0 +1,91 @@ +import os 
+import sys +import importlib +import psutil +from concurrent.futures import ThreadPoolExecutor, as_completed +from queue import Queue +from types import ModuleType +from typing import Any, List, Callable +from tqdm import tqdm + +import roop + +FRAME_PROCESSORS_MODULES: List[ModuleType] = [] +FRAME_PROCESSORS_INTERFACE = [ + 'pre_check', + 'pre_start', + 'process_frame', + 'process_frames', + 'process_image', + 'process_video', + 'post_process' +] + + +def load_frame_processor_module(frame_processor: str) -> Any: + try: + frame_processor_module = importlib.import_module(f'roop.processors.frame.{frame_processor}') + for method_name in FRAME_PROCESSORS_INTERFACE: + if not hasattr(frame_processor_module, method_name): + raise NotImplementedError + except ModuleNotFoundError: + sys.exit(f'Frame processor {frame_processor} not found.') + except NotImplementedError: + sys.exit(f'Frame processor {frame_processor} not implemented correctly.') + return frame_processor_module + + +def get_frame_processors_modules(frame_processors: List[str]) -> List[ModuleType]: + global FRAME_PROCESSORS_MODULES + + if not FRAME_PROCESSORS_MODULES: + for frame_processor in frame_processors: + frame_processor_module = load_frame_processor_module(frame_processor) + FRAME_PROCESSORS_MODULES.append(frame_processor_module) + return FRAME_PROCESSORS_MODULES + + +def multi_process_frame(source_path: str, temp_frame_paths: List[str], process_frames: Callable[[str, List[str], Any], None], update: Callable[[], None]) -> None: + with ThreadPoolExecutor(max_workers=roop.globals.execution_threads) as executor: + futures = [] + queue = create_queue(temp_frame_paths) + queue_per_future = max(len(temp_frame_paths) // roop.globals.execution_threads, 1) + while not queue.empty(): + future = executor.submit(process_frames, source_path, pick_queue(queue, queue_per_future), update) + futures.append(future) + for future in as_completed(futures): + future.result() + + +def create_queue(temp_frame_paths: 
List[str]) -> Queue[str]: + queue: Queue[str] = Queue() + for frame_path in temp_frame_paths: + queue.put(frame_path) + return queue + + +def pick_queue(queue: Queue[str], queue_per_future: int) -> List[str]: + queues = [] + for _ in range(queue_per_future): + if not queue.empty(): + queues.append(queue.get()) + return queues + + +def process_video(source_path: str, frame_paths: list[str], process_frames: Callable[[str, List[str], Any], None]) -> None: + progress_bar_format = '{l_bar}{bar}| {n_fmt}/{total_fmt} [{elapsed}<{remaining}, {rate_fmt}{postfix}]' + total = len(frame_paths) + with tqdm(total=total, desc='Processing', unit='frame', dynamic_ncols=True, bar_format=progress_bar_format) as progress: + multi_process_frame(source_path, frame_paths, process_frames, lambda: update_progress(progress)) + + +def update_progress(progress: Any = None) -> None: + process = psutil.Process(os.getpid()) + memory_usage = process.memory_info().rss / 1024 / 1024 / 1024 + progress.set_postfix({ + 'memory_usage': '{:.2f}'.format(memory_usage).zfill(5) + 'GB', + 'execution_providers': roop.globals.execution_providers, + 'execution_threads': roop.globals.execution_threads + }) + progress.refresh() + progress.update(1) diff --git a/roop/processors/frame/face_enhancer.py b/roop/processors/frame/face_enhancer.py new file mode 100644 index 0000000000000000000000000000000000000000..3a7f5a217f1e7f3f6d23f42fcbe97145d0ce1c2d --- /dev/null +++ b/roop/processors/frame/face_enhancer.py @@ -0,0 +1,104 @@ +from typing import Any, List, Callable +import cv2 +import threading +from gfpgan.utils import GFPGANer + +import roop.globals +import roop.processors.frame.core +from roop.core import update_status +from roop.face_analyser import get_many_faces +from roop.typing import Frame, Face +from roop.utilities import conditional_download, resolve_relative_path, is_image, is_video + +FACE_ENHANCER = None +THREAD_SEMAPHORE = threading.Semaphore() +THREAD_LOCK = threading.Lock() +NAME = 
'ROOP.FACE-ENHANCER' + + +def get_face_enhancer() -> Any: + global FACE_ENHANCER + + with THREAD_LOCK: + if FACE_ENHANCER is None: + model_path = resolve_relative_path('../models/GFPGANv1.4.pth') + # todo: set models path -> https://github.com/TencentARC/GFPGAN/issues/399 + FACE_ENHANCER = GFPGANer(model_path=model_path, upscale=1, device=get_device()) + return FACE_ENHANCER + + +def get_device() -> str: + if 'CUDAExecutionProvider' in roop.globals.execution_providers: + return 'cuda' + if 'CoreMLExecutionProvider' in roop.globals.execution_providers: + return 'mps' + return 'cpu' + + +def clear_face_enhancer() -> None: + global FACE_ENHANCER + + FACE_ENHANCER = None + + +def pre_check() -> bool: + download_directory_path = resolve_relative_path('../models') + conditional_download(download_directory_path, ['https://huggingface.co/henryruhs/roop/resolve/main/GFPGANv1.4.pth']) + return True + + +def pre_start() -> bool: + if not is_image(roop.globals.target_path) and not is_video(roop.globals.target_path): + update_status('Select an image or video for target path.', NAME) + return False + return True + + +def post_process() -> None: + clear_face_enhancer() + + +def enhance_face(target_face: Face, temp_frame: Frame) -> Frame: + start_x, start_y, end_x, end_y = map(int, target_face['bbox']) + padding_x = int((end_x - start_x) * 0.5) + padding_y = int((end_y - start_y) * 0.5) + start_x = max(0, start_x - padding_x) + start_y = max(0, start_y - padding_y) + end_x = max(0, end_x + padding_x) + end_y = max(0, end_y + padding_y) + temp_face = temp_frame[start_y:end_y, start_x:end_x] + if temp_face.size: + with THREAD_SEMAPHORE: + _, _, temp_face = get_face_enhancer().enhance( + temp_face, + paste_back=True + ) + temp_frame[start_y:end_y, start_x:end_x] = temp_face + return temp_frame + + +def process_frame(source_face: Face, reference_face: Face, temp_frame: Frame) -> Frame: + many_faces = get_many_faces(temp_frame) + if many_faces: + for target_face in many_faces: + 
temp_frame = enhance_face(target_face, temp_frame) + return temp_frame + + +def process_frames(source_path: str, temp_frame_paths: List[str], update: Callable[[], None]) -> None: + for temp_frame_path in temp_frame_paths: + temp_frame = cv2.imread(temp_frame_path) + result = process_frame(None, None, temp_frame) + cv2.imwrite(temp_frame_path, result) + if update: + update() + + +def process_image(source_path: str, target_path: str, output_path: str) -> None: + target_frame = cv2.imread(target_path) + result = process_frame(None, None, target_frame) + cv2.imwrite(output_path, result) + + +def process_video(source_path: str, temp_frame_paths: List[str]) -> None: + roop.processors.frame.core.process_video(None, temp_frame_paths, process_frames) diff --git a/roop/processors/frame/face_swapper.py b/roop/processors/frame/face_swapper.py new file mode 100644 index 0000000000000000000000000000000000000000..b8072076f11bd3dc836b66afb5ebc7619bdce424 --- /dev/null +++ b/roop/processors/frame/face_swapper.py @@ -0,0 +1,100 @@ +from typing import Any, List, Callable +import cv2 +import insightface +import threading + +import roop.globals +import roop.processors.frame.core +from roop.core import update_status +from roop.face_analyser import get_one_face, get_many_faces, find_similar_face +from roop.face_reference import get_face_reference, set_face_reference, clear_face_reference +from roop.typing import Face, Frame +from roop.utilities import conditional_download, resolve_relative_path, is_image, is_video + +FACE_SWAPPER = None +THREAD_LOCK = threading.Lock() +NAME = 'ROOP.FACE-SWAPPER' + + +def get_face_swapper() -> Any: + global FACE_SWAPPER + + with THREAD_LOCK: + if FACE_SWAPPER is None: + model_path = resolve_relative_path('../models/inswapper_128.onnx') + FACE_SWAPPER = insightface.model_zoo.get_model(model_path, providers=roop.globals.execution_providers) + return FACE_SWAPPER + + +def clear_face_swapper() -> None: + global FACE_SWAPPER + + FACE_SWAPPER = None + + +def 
pre_check() -> bool: + download_directory_path = resolve_relative_path('../models') + conditional_download(download_directory_path, ['https://huggingface.co/henryruhs/roop/resolve/main/inswapper_128.onnx']) + return True + + +def pre_start() -> bool: + if not is_image(roop.globals.source_path): + update_status('Select an image for source path.', NAME) + return False + elif not get_one_face(cv2.imread(roop.globals.source_path)): + update_status('No face in source path detected.', NAME) + return False + if not is_image(roop.globals.target_path) and not is_video(roop.globals.target_path): + update_status('Select an image or video for target path.', NAME) + return False + return True + + +def post_process() -> None: + clear_face_swapper() + clear_face_reference() + + +def swap_face(source_face: Face, target_face: Face, temp_frame: Frame) -> Frame: + return get_face_swapper().get(temp_frame, target_face, source_face, paste_back=True) + + +def process_frame(source_face: Face, reference_face: Face, temp_frame: Frame) -> Frame: + if roop.globals.many_faces: + many_faces = get_many_faces(temp_frame) + if many_faces: + for target_face in many_faces: + temp_frame = swap_face(source_face, target_face, temp_frame) + else: + target_face = find_similar_face(temp_frame, reference_face) + if target_face: + temp_frame = swap_face(source_face, target_face, temp_frame) + return temp_frame + + +def process_frames(source_path: str, temp_frame_paths: List[str], update: Callable[[], None]) -> None: + source_face = get_one_face(cv2.imread(source_path)) + reference_face = None if roop.globals.many_faces else get_face_reference() + for temp_frame_path in temp_frame_paths: + temp_frame = cv2.imread(temp_frame_path) + result = process_frame(source_face, reference_face, temp_frame) + cv2.imwrite(temp_frame_path, result) + if update: + update() + + +def process_image(source_path: str, target_path: str, output_path: str) -> None: + source_face = get_one_face(cv2.imread(source_path)) + 
target_frame = cv2.imread(target_path) + reference_face = None if roop.globals.many_faces else get_one_face(target_frame, roop.globals.reference_face_position) + result = process_frame(source_face, reference_face, target_frame) + cv2.imwrite(output_path, result) + + +def process_video(source_path: str, temp_frame_paths: List[str]) -> None: + if not roop.globals.many_faces and not get_face_reference(): + reference_frame = cv2.imread(temp_frame_paths[roop.globals.reference_frame_number]) + reference_face = get_one_face(reference_frame, roop.globals.reference_face_position) + set_face_reference(reference_face) + roop.processors.frame.core.process_video(source_path, temp_frame_paths, process_frames) diff --git a/roop/typing.py b/roop/typing.py new file mode 100644 index 0000000000000000000000000000000000000000..1cff7440616e20bfe7b8bc287f86d11bf1b0f083 --- /dev/null +++ b/roop/typing.py @@ -0,0 +1,7 @@ +from typing import Any + +from insightface.app.common import Face +import numpy + +Face = Face +Frame = numpy.ndarray[Any, Any] diff --git a/roop/ui.json b/roop/ui.json new file mode 100644 index 0000000000000000000000000000000000000000..cf63a226f37feed2fd3c08f50b4becbd74e69613 --- /dev/null +++ b/roop/ui.json @@ -0,0 +1,161 @@ +{ + "CTk": { + "fg_color": ["gray95", "gray10"] + }, + "CTkToplevel": { + "fg_color": ["gray95", "gray10"] + }, + "CTkFrame": { + "corner_radius": 6, + "border_width": 0, + "fg_color": ["gray90", "gray13"], + "top_fg_color": ["gray85", "gray16"], + "border_color": ["gray65", "gray28"] + }, + "CTkButton": { + "corner_radius": 6, + "border_width": 0, + "fg_color": ["#3a7ebf", "#1f538d"], + "hover_color": ["#325882", "#14375e"], + "border_color": ["#3E454A", "#949A9F"], + "text_color": ["#DCE4EE", "#DCE4EE"], + "text_color_disabled": ["gray74", "gray60"] + }, + "CTkLabel": { + "corner_radius": 0, + "fg_color": "transparent", + "text_color": ["gray14", "gray84"] + }, + "CTkEntry": { + "corner_radius": 6, + "border_width": 2, + "fg_color": ["#F9F9FA", 
"#343638"], + "border_color": ["#979DA2", "#565B5E"], + "text_color": ["gray14", "gray84"], + "placeholder_text_color": ["gray52", "gray62"] + }, + "CTkCheckbox": { + "corner_radius": 6, + "border_width": 3, + "fg_color": ["#3a7ebf", "#1f538d"], + "border_color": ["#3E454A", "#949A9F"], + "hover_color": ["#325882", "#14375e"], + "checkmark_color": ["#DCE4EE", "gray90"], + "text_color": ["gray14", "gray84"], + "text_color_disabled": ["gray60", "gray45"] + }, + "CTkSwitch": { + "corner_radius": 1000, + "border_width": 3, + "button_length": 0, + "fg_color": ["#939BA2", "#4A4D50"], + "progress_color": ["#3a7ebf", "#1f538d"], + "button_color": ["gray36", "#D5D9DE"], + "button_hover_color": ["gray20", "gray100"], + "text_color": ["gray14", "gray84"], + "text_color_disabled": ["gray60", "gray45"] + }, + "CTkRadiobutton": { + "corner_radius": 1000, + "border_width_checked": 6, + "border_width_unchecked": 3, + "fg_color": ["#3a7ebf", "#1f538d"], + "border_color": ["#3E454A", "#949A9F"], + "hover_color": ["#325882", "#14375e"], + "text_color": ["gray14", "gray84"], + "text_color_disabled": ["gray60", "gray45"] + }, + "CTkProgressBar": { + "corner_radius": 1000, + "border_width": 0, + "fg_color": ["#939BA2", "#4A4D50"], + "progress_color": ["#3a7ebf", "#1f538d"], + "border_color": ["gray", "gray"] + }, + "CTkSlider": { + "corner_radius": 1000, + "button_corner_radius": 1000, + "border_width": 6, + "button_length": 0, + "fg_color": ["#939BA2", "#4A4D50"], + "progress_color": ["gray40", "#AAB0B5"], + "button_color": ["#3a7ebf", "#1f538d"], + "button_hover_color": ["#325882", "#14375e"] + }, + "CTkOptionMenu": { + "corner_radius": 6, + "fg_color": ["#3a7ebf", "#1f538d"], + "button_color": ["#325882", "#14375e"], + "button_hover_color": ["#234567", "#1e2c40"], + "text_color": ["#DCE4EE", "#DCE4EE"], + "text_color_disabled": ["gray74", "gray60"] + }, + "CTkComboBox": { + "corner_radius": 6, + "border_width": 2, + "fg_color": ["#F9F9FA", "#343638"], + "border_color": ["#979DA2", 
"#565B5E"], + "button_color": ["#979DA2", "#565B5E"], + "button_hover_color": ["#6E7174", "#7A848D"], + "text_color": ["gray14", "gray84"], + "text_color_disabled": ["gray50", "gray45"] + }, + "CTkScrollbar": { + "corner_radius": 1000, + "border_spacing": 4, + "fg_color": "transparent", + "button_color": ["gray55", "gray41"], + "button_hover_color": ["gray40", "gray53"] + }, + "CTkSegmentedButton": { + "corner_radius": 6, + "border_width": 2, + "fg_color": ["#979DA2", "gray29"], + "selected_color": ["#3a7ebf", "#1f538d"], + "selected_hover_color": ["#325882", "#14375e"], + "unselected_color": ["#979DA2", "gray29"], + "unselected_hover_color": ["gray70", "gray41"], + "text_color": ["#DCE4EE", "#DCE4EE"], + "text_color_disabled": ["gray74", "gray60"] + }, + "CTkTextbox": { + "corner_radius": 6, + "border_width": 0, + "fg_color": ["gray100", "gray20"], + "border_color": ["#979DA2", "#565B5E"], + "text_color": ["gray14", "gray84"], + "scrollbar_button_color": ["gray55", "gray41"], + "scrollbar_button_hover_color": ["gray40", "gray53"] + }, + "CTkScrollableFrame": { + "label_fg_color": ["gray80", "gray21"] + }, + "DropdownMenu": { + "fg_color": ["gray90", "gray20"], + "hover_color": ["gray75", "gray28"], + "text_color": ["gray14", "gray84"] + }, + "CTkFont": { + "macOS": { + "family": "Avenir", + "size": 12, + "weight": "normal" + }, + "Windows": { + "family": "Corbel", + "size": 12, + "weight": "normal" + }, + "Linux": { + "family": "Montserrat", + "size": 12, + "weight": "normal" + } + }, + "RoopDropArea": { + "fg_color": ["gray90", "gray13"] + }, + "RoopDonate": { + "text_color": ["#3a7ebf", "gray60"] + } +} diff --git a/roop/ui.py b/roop/ui.py new file mode 100644 index 0000000000000000000000000000000000000000..cebe6a20c3bc63dbecdff85ba387bfab73b15232 --- /dev/null +++ b/roop/ui.py @@ -0,0 +1,285 @@ +import os +import sys +import webbrowser +import customtkinter as ctk +from tkinterdnd2 import TkinterDnD, DND_ALL +from typing import Any, Callable, Tuple, Optional 
+import cv2 +from PIL import Image, ImageOps + +import roop.globals +import roop.metadata +from roop.face_analyser import get_one_face +from roop.capturer import get_video_frame, get_video_frame_total +from roop.face_reference import get_face_reference, set_face_reference, clear_face_reference +from roop.predictor import predict_frame, clear_predictor +from roop.processors.frame.core import get_frame_processors_modules +from roop.utilities import is_image, is_video, resolve_relative_path + +ROOT = None +ROOT_HEIGHT = 700 +ROOT_WIDTH = 600 + +PREVIEW = None +PREVIEW_MAX_HEIGHT = 700 +PREVIEW_MAX_WIDTH = 1200 + +RECENT_DIRECTORY_SOURCE = None +RECENT_DIRECTORY_TARGET = None +RECENT_DIRECTORY_OUTPUT = None + +preview_label = None +preview_slider = None +source_label = None +target_label = None +status_label = None + + +# todo: remove by native support -> https://github.com/TomSchimansky/CustomTkinter/issues/934 +class CTk(ctk.CTk, TkinterDnD.DnDWrapper): + def __init__(self, *args: Any, **kwargs: Any) -> None: + super().__init__(*args, **kwargs) + self.TkdndVersion = TkinterDnD._require(self) + + +def init(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: + global ROOT, PREVIEW + + ROOT = create_root(start, destroy) + PREVIEW = create_preview(ROOT) + + return ROOT + + +def create_root(start: Callable[[], None], destroy: Callable[[], None]) -> ctk.CTk: + global source_label, target_label, status_label + + ctk.deactivate_automatic_dpi_awareness() + ctk.set_appearance_mode('system') + ctk.set_default_color_theme(resolve_relative_path('ui.json')) + + root = CTk() + root.minsize(ROOT_WIDTH, ROOT_HEIGHT) + root.title(f'{roop.metadata.name} {roop.metadata.version}') + root.configure() + root.protocol('WM_DELETE_WINDOW', lambda: destroy()) + + source_label = ctk.CTkLabel(root, text=None, fg_color=ctk.ThemeManager.theme.get('RoopDropArea').get('fg_color')) + source_label.place(relx=0.1, rely=0.1, relwidth=0.3, relheight=0.25) + 
source_label.drop_target_register(DND_ALL) + source_label.dnd_bind('<<Drop>>', lambda event: select_source_path(event.data)) + if roop.globals.source_path: + select_source_path(roop.globals.source_path) + + target_label = ctk.CTkLabel(root, text=None, fg_color=ctk.ThemeManager.theme.get('RoopDropArea').get('fg_color')) + target_label.place(relx=0.6, rely=0.1, relwidth=0.3, relheight=0.25) + target_label.drop_target_register(DND_ALL) + target_label.dnd_bind('<<Drop>>', lambda event: select_target_path(event.data)) + if roop.globals.target_path: + select_target_path(roop.globals.target_path) + + source_button = ctk.CTkButton(root, text='Select a face', cursor='hand2', command=lambda: select_source_path()) + source_button.place(relx=0.1, rely=0.4, relwidth=0.3, relheight=0.1) + + target_button = ctk.CTkButton(root, text='Select a target', cursor='hand2', command=lambda: select_target_path()) + target_button.place(relx=0.6, rely=0.4, relwidth=0.3, relheight=0.1) + + keep_fps_value = ctk.BooleanVar(value=roop.globals.keep_fps) + keep_fps_checkbox = ctk.CTkSwitch(root, text='Keep target fps', variable=keep_fps_value, cursor='hand2', command=lambda: setattr(roop.globals, 'keep_fps', not roop.globals.keep_fps)) + keep_fps_checkbox.place(relx=0.1, rely=0.6) + + keep_frames_value = ctk.BooleanVar(value=roop.globals.keep_frames) + keep_frames_switch = ctk.CTkSwitch(root, text='Keep temporary frames', variable=keep_frames_value, cursor='hand2', command=lambda: setattr(roop.globals, 'keep_frames', keep_frames_value.get())) + keep_frames_switch.place(relx=0.1, rely=0.65) + + skip_audio_value = ctk.BooleanVar(value=roop.globals.skip_audio) + skip_audio_switch = ctk.CTkSwitch(root, text='Skip target audio', variable=skip_audio_value, cursor='hand2', command=lambda: setattr(roop.globals, 'skip_audio', skip_audio_value.get())) + skip_audio_switch.place(relx=0.6, rely=0.6) + + many_faces_value = ctk.BooleanVar(value=roop.globals.many_faces) + many_faces_switch = ctk.CTkSwitch(root, 
text='Many faces', variable=many_faces_value, cursor='hand2', command=lambda: setattr(roop.globals, 'many_faces', many_faces_value.get())) + many_faces_switch.place(relx=0.6, rely=0.65) + + start_button = ctk.CTkButton(root, text='Start', cursor='hand2', command=lambda: select_output_path(start)) + start_button.place(relx=0.15, rely=0.75, relwidth=0.2, relheight=0.05) + + stop_button = ctk.CTkButton(root, text='Destroy', cursor='hand2', command=lambda: destroy()) + stop_button.place(relx=0.4, rely=0.75, relwidth=0.2, relheight=0.05) + + preview_button = ctk.CTkButton(root, text='Preview', cursor='hand2', command=lambda: toggle_preview()) + preview_button.place(relx=0.65, rely=0.75, relwidth=0.2, relheight=0.05) + + status_label = ctk.CTkLabel(root, text=None, justify='center') + status_label.place(relx=0.1, rely=0.9, relwidth=0.8) + + donate_label = ctk.CTkLabel(root, text='^_^ Donate to project ^_^', justify='center', cursor='hand2') + donate_label.place(relx=0.1, rely=0.95, relwidth=0.8) + donate_label.configure(text_color=ctk.ThemeManager.theme.get('RoopDonate').get('text_color')) + donate_label.bind('<Button>', lambda event: webbrowser.open('https://github.com/sponsors/s0md3v')) + + return root + + +def create_preview(parent: ctk.CTkToplevel) -> ctk.CTkToplevel: + global preview_label, preview_slider + + preview = ctk.CTkToplevel(parent) + preview.withdraw() + preview.configure() + preview.protocol('WM_DELETE_WINDOW', lambda: toggle_preview()) + preview.resizable(width=False, height=False) + + preview_label = ctk.CTkLabel(preview, text=None) + preview_label.pack(fill='both', expand=True) + + preview_slider = ctk.CTkSlider(preview, from_=0, to=0, command=lambda frame_value: update_preview(frame_value)) + + preview.bind('<Up>', lambda event: update_face_reference(1)) + preview.bind('<Down>', lambda event: update_face_reference(-1)) + return preview + + +def update_status(text: str) -> None: + status_label.configure(text=text) + ROOT.update() + + +def 
select_source_path(source_path: Optional[str] = None) -> None: + global RECENT_DIRECTORY_SOURCE + + if PREVIEW: + PREVIEW.withdraw() + if source_path is None: + source_path = ctk.filedialog.askopenfilename(title='select an source image', initialdir=RECENT_DIRECTORY_SOURCE) + if is_image(source_path): + roop.globals.source_path = source_path + RECENT_DIRECTORY_SOURCE = os.path.dirname(roop.globals.source_path) + image = render_image_preview(roop.globals.source_path, (200, 200)) + source_label.configure(image=image) + else: + roop.globals.source_path = None + source_label.configure(image=None) + + +def select_target_path(target_path: Optional[str] = None) -> None: + global RECENT_DIRECTORY_TARGET + + if PREVIEW: + PREVIEW.withdraw() + clear_face_reference() + if target_path is None: + target_path = ctk.filedialog.askopenfilename(title='select an target image or video', initialdir=RECENT_DIRECTORY_TARGET) + if is_image(target_path): + roop.globals.target_path = target_path + RECENT_DIRECTORY_TARGET = os.path.dirname(roop.globals.target_path) + image = render_image_preview(roop.globals.target_path, (200, 200)) + target_label.configure(image=image) + elif is_video(target_path): + roop.globals.target_path = target_path + RECENT_DIRECTORY_TARGET = os.path.dirname(roop.globals.target_path) + video_frame = render_video_preview(target_path, (200, 200)) + target_label.configure(image=video_frame) + else: + roop.globals.target_path = None + target_label.configure(image=None) + + +def select_output_path(start: Callable[[], None]) -> None: + global RECENT_DIRECTORY_OUTPUT + + if is_image(roop.globals.target_path): + output_path = ctk.filedialog.asksaveasfilename(title='save image output file', defaultextension='.png', initialfile='output.png', initialdir=RECENT_DIRECTORY_OUTPUT) + elif is_video(roop.globals.target_path): + output_path = ctk.filedialog.asksaveasfilename(title='save video output file', defaultextension='.mp4', initialfile='output.mp4', 
initialdir=RECENT_DIRECTORY_OUTPUT) + else: + output_path = None + if output_path: + roop.globals.output_path = output_path + RECENT_DIRECTORY_OUTPUT = os.path.dirname(roop.globals.output_path) + start() + + +def render_image_preview(image_path: str, size: Tuple[int, int]) -> ctk.CTkImage: + image = Image.open(image_path) + if size: + image = ImageOps.fit(image, size, Image.LANCZOS) + return ctk.CTkImage(image, size=image.size) + + +def render_video_preview(video_path: str, size: Tuple[int, int], frame_number: int = 0) -> ctk.CTkImage: + capture = cv2.VideoCapture(video_path) + if frame_number: + capture.set(cv2.CAP_PROP_POS_FRAMES, frame_number) + has_frame, frame = capture.read() + if has_frame: + image = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)) + if size: + image = ImageOps.fit(image, size, Image.LANCZOS) + return ctk.CTkImage(image, size=image.size) + capture.release() + cv2.destroyAllWindows() + + +def toggle_preview() -> None: + if PREVIEW.state() == 'normal': + PREVIEW.unbind('<Right>') + PREVIEW.unbind('<Left>') + PREVIEW.withdraw() + clear_predictor() + elif roop.globals.source_path and roop.globals.target_path: + init_preview() + update_preview(roop.globals.reference_frame_number) + PREVIEW.deiconify() + + +def init_preview() -> None: + PREVIEW.title('Preview [ ↕ Reference face ]') + if is_image(roop.globals.target_path): + preview_slider.pack_forget() + if is_video(roop.globals.target_path): + video_frame_total = get_video_frame_total(roop.globals.target_path) + if video_frame_total > 0: + PREVIEW.title('Preview [ ↕ Reference face ] [ ↔ Frame number ]') + PREVIEW.bind('<Right>', lambda event: update_frame(int(video_frame_total / 20))) + PREVIEW.bind('<Left>', lambda event: update_frame(int(video_frame_total / -20))) + preview_slider.configure(to=video_frame_total) + preview_slider.pack(fill='x') + preview_slider.set(roop.globals.reference_frame_number) + + +def update_preview(frame_number: int = 0) -> None: + if roop.globals.source_path 
and roop.globals.target_path: + temp_frame = get_video_frame(roop.globals.target_path, frame_number) + if predict_frame(temp_frame): + sys.exit() + source_face = get_one_face(cv2.imread(roop.globals.source_path)) + if not get_face_reference(): + reference_frame = get_video_frame(roop.globals.target_path, roop.globals.reference_frame_number) + reference_face = get_one_face(reference_frame, roop.globals.reference_face_position) + set_face_reference(reference_face) + else: + reference_face = get_face_reference() + for frame_processor in get_frame_processors_modules(roop.globals.frame_processors): + temp_frame = frame_processor.process_frame( + source_face, + reference_face, + temp_frame + ) + image = Image.fromarray(cv2.cvtColor(temp_frame, cv2.COLOR_BGR2RGB)) + image = ImageOps.contain(image, (PREVIEW_MAX_WIDTH, PREVIEW_MAX_HEIGHT), Image.LANCZOS) + image = ctk.CTkImage(image, size=image.size) + preview_label.configure(image=image) + + +def update_face_reference(steps: int) -> None: + clear_face_reference() + reference_frame_number = int(preview_slider.get()) + roop.globals.reference_face_position += steps + roop.globals.reference_frame_number = reference_frame_number + update_preview(reference_frame_number) + + +def update_frame(steps: int) -> None: + frame_number = preview_slider.get() + steps + preview_slider.set(frame_number) + update_preview(preview_slider.get()) diff --git a/roop/utilities.py b/roop/utilities.py new file mode 100644 index 0000000000000000000000000000000000000000..ac0ed0daa52c9c608bba7a00e1dd6a3dde1b0100 --- /dev/null +++ b/roop/utilities.py @@ -0,0 +1,149 @@ +import glob +import mimetypes +import os +import platform +import shutil +import ssl +import subprocess +import urllib +from pathlib import Path +from typing import List, Optional +from tqdm import tqdm + +import roop.globals + +TEMP_DIRECTORY = 'temp' +TEMP_VIDEO_FILE = 'temp.mp4' + +# monkey patch ssl for mac +if platform.system().lower() == 'darwin': + ssl._create_default_https_context 
def run_ffmpeg(args: List[str]) -> bool:
    """Run ffmpeg with the shared banner/log-level flags followed by *args*.

    Returns True when the command completes successfully and False when it
    fails for any reason (non-zero exit status, ffmpeg missing, ...).
    """
    commands = ['ffmpeg', '-hide_banner', '-loglevel', roop.globals.log_level]
    commands.extend(args)
    try:
        subprocess.check_output(commands, stderr=subprocess.STDOUT)
    except Exception:
        # Best effort by design: callers branch on the boolean result, so every
        # failure is folded into False instead of propagating.
        return False
    return True


def detect_fps(target_path: str) -> float:
    """Return the frame rate ffprobe reports for the first video stream.

    ffprobe prints ``r_frame_rate`` as ``numerator/denominator``. When ffprobe
    cannot be started, exits with an error, or prints anything that is not such
    a pair (including a zero denominator), 30 is returned as a fallback.
    """
    command = ['ffprobe', '-v', 'error', '-select_streams', 'v:0', '-show_entries', 'stream=r_frame_rate', '-of', 'default=noprint_wrappers=1:nokey=1', target_path]
    try:
        # The probe itself lives inside the try block so that a missing ffprobe
        # binary or an unreadable file uses the fallback instead of crashing.
        output = subprocess.check_output(command).decode().strip().split('/')
        numerator, denominator = map(int, output)
        return numerator / denominator
    except (OSError, subprocess.SubprocessError, ValueError, ZeroDivisionError):
        return 30


def extract_frames(target_path: str, fps: float = 30) -> bool:
    """Extract the frames of *target_path* into its temp directory.

    Frames are sampled at *fps* frames per second and written as ``%04d``
    numbered files using ``roop.globals.temp_frame_format`` as extension.
    Returns the result of :func:`run_ffmpeg`.
    """
    temp_directory_path = get_temp_directory_path(target_path)
    # The configured quality is rescaled by 31/100 (integer division) before it
    # is handed to ffmpeg's -q:v option.
    temp_frame_quality = roop.globals.temp_frame_quality * 31 // 100
    frame_pattern = os.path.join(temp_directory_path, '%04d.' + roop.globals.temp_frame_format)
    return run_ffmpeg([
        '-hwaccel', 'auto',
        '-i', target_path,
        '-q:v', str(temp_frame_quality),
        '-pix_fmt', 'rgb24',
        '-vf', 'fps=' + str(fps),
        frame_pattern,
    ])


def create_video(target_path: str, fps: float = 30) -> bool:
    """Encode the numbered temp frames of *target_path* into the temp video file.

    The encoder comes from ``roop.globals.output_video_encoder``. The quality
    value is passed as ``-crf`` for libx264/libx265/libvpx and as ``-cq`` for
    the NVENC encoders; other encoders get no quality flag. Returns the result
    of :func:`run_ffmpeg`.
    """
    temp_output_path = get_temp_output_path(target_path)
    temp_directory_path = get_temp_directory_path(target_path)
    # The configured quality is rescaled as (value + 1) * 51 // 100 before use.
    output_video_quality = (roop.globals.output_video_quality + 1) * 51 // 100
    encoder = roop.globals.output_video_encoder
    frame_pattern = os.path.join(temp_directory_path, '%04d.' + roop.globals.temp_frame_format)
    commands = ['-hwaccel', 'auto', '-r', str(fps), '-i', frame_pattern, '-c:v', encoder]
    if encoder in ['libx264', 'libx265', 'libvpx']:
        commands.extend(['-crf', str(output_video_quality)])
    if encoder in ['h264_nvenc', 'hevc_nvenc']:
        commands.extend(['-cq', str(output_video_quality)])
    commands.extend(['-pix_fmt', 'yuv420p', '-vf', 'colorspace=bt709:iall=bt601-6-625:fast=1', '-y', temp_output_path])
    return run_ffmpeg(commands)


def restore_audio(target_path: str, output_path: str) -> None:
    """Write *output_path* from the temp video plus the audio of *target_path*.

    The video stream of the temp output is copied and combined with the first
    audio stream of the target. If ffmpeg fails, the temp video is moved to
    *output_path* unchanged.
    """
    temp_output_path = get_temp_output_path(target_path)
    done = run_ffmpeg(['-hwaccel', 'auto', '-i', temp_output_path, '-i', target_path, '-c:v', 'copy', '-map', '0:v:0', '-map', '1:a:0', '-y', output_path])
    if not done:
        move_temp(target_path, output_path)


def get_temp_frame_paths(target_path: str) -> List[str]:
    """Return the paths of the extracted temp frames of *target_path*, sorted.

    Only files with the ``roop.globals.temp_frame_format`` extension are
    matched. The directory part is escaped so glob metacharacters in it are
    taken literally.
    """
    temp_directory_path = get_temp_directory_path(target_path)
    pattern = os.path.join(glob.escape(temp_directory_path), '*.' + roop.globals.temp_frame_format)
    # glob returns matches in arbitrary order; sort so callers always see the
    # same sequence.
    return sorted(glob.glob(pattern))


def get_temp_directory_path(target_path: str) -> str:
    """Return ``<directory of target>/<TEMP_DIRECTORY>/<target name without extension>``."""
    target_name, _ = os.path.splitext(os.path.basename(target_path))
    target_directory_path = os.path.dirname(target_path)
    return os.path.join(target_directory_path, TEMP_DIRECTORY, target_name)


def get_temp_output_path(target_path: str) -> str:
    """Return the path of the temp video file inside the target's temp directory."""
    return os.path.join(get_temp_directory_path(target_path), TEMP_VIDEO_FILE)


def normalize_output_path(source_path: str, target_path: str, output_path: str) -> Optional[str]:
    """Resolve *output_path* to a file path.

    When all three paths are set and *output_path* is an existing directory,
    the result is ``<output_path>/<source name>-<target name><target extension>``.
    In every other case *output_path* is returned unchanged.
    """
    if source_path and target_path and output_path and os.path.isdir(output_path):
        source_name, _ = os.path.splitext(os.path.basename(source_path))
        target_name, target_extension = os.path.splitext(os.path.basename(target_path))
        return os.path.join(output_path, source_name + '-' + target_name + target_extension)
    return output_path


def create_temp(target_path: str) -> None:
    """Create the temp directory of *target_path*, including missing parents."""
    Path(get_temp_directory_path(target_path)).mkdir(parents=True, exist_ok=True)


def move_temp(target_path: str, output_path: str) -> None:
    """Move the temp video of *target_path* to *output_path*, replacing an existing file.

    Nothing happens when the temp video does not exist.
    """
    temp_output_path = get_temp_output_path(target_path)
    if not os.path.isfile(temp_output_path):
        return
    if os.path.isfile(output_path):
        os.remove(output_path)
    shutil.move(temp_output_path, output_path)


def clean_temp(target_path: str) -> None:
    """Remove the temp directory of *target_path* and its parent when it is empty.

    The temp directory is kept when ``roop.globals.keep_frames`` is set. The
    parent directory is only removed if nothing is left inside it.
    """
    temp_directory_path = get_temp_directory_path(target_path)
    parent_directory_path = os.path.dirname(temp_directory_path)
    if not roop.globals.keep_frames and os.path.isdir(temp_directory_path):
        shutil.rmtree(temp_directory_path)
    # isdir (not exists) so that listdir is never called on a regular file
    if os.path.isdir(parent_directory_path) and not os.listdir(parent_directory_path):
        os.rmdir(parent_directory_path)


def has_image_extension(image_path: str) -> bool:
    """Return True when *image_path* ends in .png, .jpg, .jpeg or .webp (case-insensitive)."""
    # The dot is part of each suffix so that names such as 'notapng' are rejected.
    return image_path.lower().endswith(('.png', '.jpg', '.jpeg', '.webp'))


def is_image(image_path: str) -> bool:
    """Return True when *image_path* is an existing file whose guessed MIME type is ``image/*``.

    The type is guessed by ``mimetypes.guess_type``, i.e. from the file name.
    """
    if image_path and os.path.isfile(image_path):
        mimetype, _ = mimetypes.guess_type(image_path)
        return bool(mimetype and mimetype.startswith('image/'))
    return False


def is_video(video_path: str) -> bool:
    """Return True when *video_path* is an existing file whose guessed MIME type is ``video/*``.

    The type is guessed by ``mimetypes.guess_type``, i.e. from the file name.
    """
    if video_path and os.path.isfile(video_path):
        mimetype, _ = mimetypes.guess_type(video_path)
        return bool(mimetype and mimetype.startswith('video/'))
    return False


def conditional_download(download_directory_path: str, urls: List[str]) -> None:
    """Download every URL in *urls* that is missing from *download_directory_path*.

    The directory is created when needed. Each file is named after the last
    path component of its URL and is skipped when it already exists. Data is
    first written to ``<name>.part`` and renamed only after the transfer
    finished, so an interrupted download is retried on the next call instead
    of being mistaken for a complete file. Errors raised by the transfer
    propagate to the caller.
    """
    # The module-level ``import urllib`` does not load the request submodule.
    import urllib.request

    os.makedirs(download_directory_path, exist_ok=True)
    for url in urls:
        download_file_path = os.path.join(download_directory_path, os.path.basename(url))
        if os.path.exists(download_file_path):
            continue
        partial_file_path = download_file_path + '.part'
        with tqdm(desc='Downloading', unit='B', unit_scale=True, unit_divisor=1024) as progress:

            def report(count: int, block_size: int, total_size: int) -> None:
                # urlretrieve reports the number of blocks transferred so far;
                # advance the bar by the difference to the bytes already shown.
                if total_size > 0:
                    progress.total = total_size
                progress.update(count * block_size - progress.n)

            urllib.request.urlretrieve(url, partial_file_path, reporthook=report)
        os.replace(partial_file_path, download_file_path)


def resolve_relative_path(path: str) -> str:
    """Return the absolute form of *path* resolved against this module's directory."""
    return os.path.abspath(os.path.join(os.path.dirname(__file__), path))
center; + min-height: 100vh; + } + #container { + width: 90%; + max-width: 800px; + padding: 20px; + background-color: #ffffff; + border-radius: 10px; + box-shadow: 0px 0px 20px rgba(0, 0, 0, 0.1); + } + h1 { + text-align: center; + color: #333333; + margin-bottom: 20px; + } + #errorMessage { + text-align: center; + margin-top: 20px; + color: #cc0000; + } + #backButton { + text-align: center; + margin-top: 25px; + } + #backButton a { + text-decoration: none; + background-color: #4285f4; + color: white; + border: none; + padding: 10px 20px; + cursor: pointer; + border-radius: 5px; + font-weight: bold; + transition: background-color 0.3s; + } + #backButton a:hover { + background-color: #2a75d7; + } + </style> +</head> +<body> + <div id="container"> + <h1>Error</h1> + <div id="errorMessage"> + An error occurred while processing the images/videos. + </div> + <div id="backButton"> + <a href="/">Back to Processing</a> + </div> + </div> +</body> +</html> diff --git a/templates/index.html b/templates/index.html new file mode 100644 index 0000000000000000000000000000000000000000..8cad500f4c0995401075f004f8dd35c98edf69e1 --- /dev/null +++ b/templates/index.html @@ -0,0 +1,116 @@ +<!DOCTYPE html> +<html lang="en"> +<head> + <meta charset="UTF-8"> + <meta name="viewport" content="width=device-width, initial-scale=1.0"> + <title>Image and Video Processing</title> + <style> + body { + font-family: 'Segoe UI', Arial, sans-serif; + background-color: #f8f8f8; + margin: 0; + padding: 0; + display: flex; + justify-content: center; + align-items: center; + min-height: 100vh; + } + #container { + width: 90%; + max-width: 800px; + padding: 20px; + background-color: #ffffff; + border-radius: 10px; + box-shadow: 0px 0px 20px rgba(0, 0, 0, 0.1); + } + h1 { + text-align: center; + color: #333333; + margin-bottom: 30px; + } + label { + font-weight: bold; + color: #444444; + display: block; + margin-bottom: 5px; + } + input[type="file"] { + display: block; + margin-bottom: 15px; + width: 
/**
 * Show a thumbnail of the file chosen in a file input.
 *
 * The preview container is always emptied first. A thumbnail is only
 * rendered when a file is selected and the browser reports an image MIME
 * type for it; other uploads (for example videos) leave the container empty.
 *
 * @param {HTMLInputElement} input - The file input that changed.
 * @param {string} previewId - The id of the element that receives the thumbnail.
 */
function previewImage(input, previewId) {
    var preview = document.getElementById(previewId);
    var file = input.files && input.files[0];

    // Remove the stale thumbnail even when the new selection cannot be shown.
    preview.innerHTML = '';

    // Cancelling the file dialog leaves no file; readAsDataURL would throw on it.
    if (!file || file.type.indexOf('image/') !== 0) {
        return;
    }

    var reader = new FileReader();
    reader.onload = function(e) {
        var image = new Image();
        image.src = e.target.result;
        preview.innerHTML = '';
        preview.appendChild(image);
    };
    reader.readAsDataURL(file);
}
+</html> diff --git a/templates/output.html b/templates/output.html new file mode 100644 index 0000000000000000000000000000000000000000..d1e98ac82005eb5420e35732c2729520b82d94ff --- /dev/null +++ b/templates/output.html @@ -0,0 +1,72 @@ +<!DOCTYPE html> +<html lang="en"> +<head> + <meta charset="UTF-8"> + <meta name="viewport" content="width=device-width, initial-scale=1.0"> + <title>Output</title> + <style> + body { + font-family: 'Segoe UI', Arial, sans-serif; + background-color: #f8f8f8; + margin: 0; + padding: 0; + display: flex; + justify-content: center; + align-items: center; + min-height: 100vh; + } + #container { + width: 90%; + max-width: 800px; + padding: 20px; + background-color: #ffffff; + border-radius: 10px; + box-shadow: 0px 0px 20px rgba(0, 0, 0, 0.1); + } + h1 { + text-align: center; + color: #333333; + margin-bottom: 30px; + } + #outputImage { + text-align: center; + margin-top: 20px; + } + #outputImage img { + max-width: 100%; + max-height: 300px; + border: 1px solid #ddd; + border-radius: 5px; + } + #backButton { + text-align: center; + margin-top: 25px; + } + #backButton a { + text-decoration: none; + background-color: #4285f4; + color: white; + border: none; + padding: 10px 20px; + cursor: pointer; + border-radius: 5px; + font-weight: bold; + transition: background-color 0.3s; + } + #backButton a:hover { + background-color: #2a75d7; + } + </style> +</head> +<body> + <div id="container"> + <h1>Output</h1> + <div id="outputImage"> + <img src="{{ url_for('output_image', filename=filename) }}" alt="Output Image"> + </div> + <div id="backButton"> + <a href="/">Back to Processing</a> + </div> + </div> +</body> +</html> diff --git a/uploads/1685074910001_vtqikl_2_0.jpg b/uploads/1685074910001_vtqikl_2_0.jpg new file mode 100644 index 0000000000000000000000000000000000000000..f0df550c5d722dde2ed7530078705b7efc2a3ed1 --- /dev/null +++ b/uploads/1685074910001_vtqikl_2_0.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid 
sha256:9b3f2abd31fbd26820ab65bd35b8defe9eff62f06af23c9fb0e69f7955f89787 +size 1091281 diff --git a/uploads/20230518_174347_0000.png b/uploads/20230518_174347_0000.png new file mode 100644 index 0000000000000000000000000000000000000000..6eae8accb453da4386d45c6a066e991ed9d53814 --- /dev/null +++ b/uploads/20230518_174347_0000.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80738f0e0709f78fc1b2823b394dfe650d829000e5dc7c2d76468a16a328802c +size 3245104 diff --git a/uploads/FB_IMG_1690825211219.jpg b/uploads/FB_IMG_1690825211219.jpg new file mode 100644 index 0000000000000000000000000000000000000000..794d2b1e8084f92999785b7c8bf7049806d2ed8d Binary files /dev/null and b/uploads/FB_IMG_1690825211219.jpg differ diff --git a/uploads/kashmirtweetsofficial-20230530-0001.mp4 b/uploads/kashmirtweetsofficial-20230530-0001.mp4 new file mode 100644 index 0000000000000000000000000000000000000000..da6f97015d32f3351b41f5222148031ff8118369 Binary files /dev/null and b/uploads/kashmirtweetsofficial-20230530-0001.mp4 differ diff --git a/uploads/output b/uploads/output new file mode 100644 index 0000000000000000000000000000000000000000..794d2b1e8084f92999785b7c8bf7049806d2ed8d Binary files /dev/null and b/uploads/output differ