From f3ff47c11b2a42095cc6ec78d9d46a2c4177e3cf Mon Sep 17 00:00:00 2001 From: pokepress <69562368+pokepress@users.noreply.github.com> Date: Mon, 27 Jan 2025 20:31:36 -0600 Subject: [PATCH] =?UTF-8?q?Add=20NES=20Composite=20to=20RGB=20Model,=20Dig?= =?UTF-8?q?ital=20Pok=C3=A9mon=20Models=20(#464)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit * Adds the models I created for the Super Mario Bros Super Show. Note that the large model is actually a 2x model, but I used a 4x model as the base (apparently that's allowed). Each entry has two resources because there is a live-action and animated model (users are expected to interpolate them for things like the opening sequence). * Rename large model file to avoid confusion * Add NES Composite to RGB Model * Add Digital Pokemon models --- data/models/1x-NES-Composite-2-RGB.json | 53 ++++++++++++++++++++++ data/models/2x-DigitalPokemon-l.json | 59 +++++++++++++++++++++++++ data/models/2x-DigitalPokemon-s.json | 59 +++++++++++++++++++++++++ 3 files changed, 171 insertions(+) create mode 100644 data/models/1x-NES-Composite-2-RGB.json create mode 100644 data/models/2x-DigitalPokemon-l.json create mode 100644 data/models/2x-DigitalPokemon-s.json diff --git a/data/models/1x-NES-Composite-2-RGB.json b/data/models/1x-NES-Composite-2-RGB.json new file mode 100644 index 0000000..5ca10c3 --- /dev/null +++ b/data/models/1x-NES-Composite-2-RGB.json @@ -0,0 +1,53 @@ +{ + "name": "NES Composite to RGB", + "author": "pokepress", + "license": "MIT", + "tags": [ + "debanding", + "denoise", + "restoration", + "video-frame" + ], + "description": "Takes composite/RF/VHS NES footage and attempts to restore it to RGB quality. Assumes footage has been properly deinterlaced via field duplication from 240p to 480p. 
Note that:\n\n* All footage was captured in 240p/480p NTSC.\n* RGB footage was captured via an AV Famicom with the RGB Blaster via the Retrotink 2x.\n* The model was trained exclusively on individual frames, so it can't fix things like dropouts.\n* The even and odd fields of NES composite tend to be a bit...different from each other, so there will be some jitter at 60fps.\n* I don't have access to an NES Toploader, so I wouldn't expect it to fix the jailbars very well.", + "date": "2024-11-03", + "architecture": "omnisr", + "size": null, + "scale": 1, + "inputChannels": 3, + "outputChannels": 3, + "resources": [ + { + "platform": "pytorch", + "type": "pth", + "size": 3223546, + "sha256": "77511d759530b0cef77c919c40870f3fe3b9330e39e2aaacaac7848c06fb2b20", + "urls": [ + "https://www.mediafire.com/file/qzaox0y51zh9ja7/NES_Composite_to_RGB.pth/file" + ] + } + ], + "trainingIterations": 445000, + "trainingHRSize": 128, + "trainingOTF": false, + "dataset": "Screenshots of NES games", + "datasetSize": 194, + "images": [ + { + "type": "paired", + "LR": "https://imgsli.com/i/ce97c530-8f99-448c-8101-e072b7f72851.jpg", + "SR": "https://imgsli.com/i/e3b66191-0e6e-4264-a97f-d7b79c8a2f23.jpg" + }, + { + "type": "paired", + "caption": "Legacy of the Wizard (VHS)", + "LR": "https://imgsli.com/i/0e8cc744-8e50-4b4c-8a0a-ccca9ffb9ea3.jpg", + "SR": "https://imgsli.com/i/d730abc1-ce80-495d-8a79-1504c6f7df33.jpg" + }, + { + "type": "paired", + "caption": "Defender of the Crown (RF)", + "LR": "https://imgsli.com/i/0f0d8130-cc2b-4e3a-afad-45aa6bf5c504.jpg", + "SR": "https://imgsli.com/i/4416deb1-bbed-49a2-b882-45179b301b46.jpg" + } + ] +} \ No newline at end of file diff --git a/data/models/2x-DigitalPokemon-l.json b/data/models/2x-DigitalPokemon-l.json new file mode 100644 index 0000000..67daed2 --- /dev/null +++ b/data/models/2x-DigitalPokemon-l.json @@ -0,0 +1,59 @@ +{ + "name": "Digital Pokémon-Large", + "author": "pokepress", + "license": "MIT", + "tags": [ + "anime", + "cartoon", + 
"general-upscaler" + ], + "description": "This model is designed to upscale the standard definition digital era of the Pokémon anime, which runs from late season 5 (Master Quest) to early season 12 (Galactic Battles). During this time, the show was animated digitally in a 4:3 ratio. This process was also used for Mewtwo Returns, most of Pokémon Chronicles, and the Mystery Dungeon specials.\n\nAdvice/Known Limitations:\n* This OmniSR model can occasionally produce black frames when run in fp16 mode. This seems to be more common in the TPCi era (seasons 9 and later). The issue is sporadic enough that it probably makes sense to do a first pass in fp16, then re-upscale any affected shots in fp32.\n* I recommend using QTGMC on a preset of \"Slow\" or slower for deinterlacing. While the show is primarily animated at 12/24 fps, some elements like backgrounds are animated at a full 60i.\n* The model is not great at handling fonts, particularly the italicized text in the episode credits. This is despite including font images in the training data.", + "date": "2025-01-05", + "architecture": "omnisr", + "size": null, + "scale": 2, + "inputChannels": 3, + "outputChannels": 3, + "resources": [ + { + "platform": "pytorch", + "type": "pth", + "size": 3244282, + "sha256": "ff5e8f803b6153b0c16ba246c5579524a978d16a90545d2736603703d9d67a2a", + "urls": [ + "https://www.mediafire.com/file/gckgn1299krt2so/digital_pokemon_omnisr.pth/file" + ] + } + ], + "trainingIterations": 465000, + "trainingHRSize": 64, + "trainingOTF": false, + "dataset": "Screenshots from seasons 6-11 of the English Pokémon dub, plus some manually created images for fonts.", + "datasetSize": 74, + "images": [ + { + "type": "paired", + "caption": "A Bite to Remember", + "LR": "https://imgsli.com/i/9ae50058-ac4a-415a-a243-8f924015fd46.jpg", + "SR": "https://imgsli.com/i/d96a8dcd-5b70-464f-8b45-2ed443f8fa3d.jpg" + }, + { + "type": "paired", + "caption": "Going, Going, Yawn Title Card", + "LR": 
"https://imgsli.com/i/64ed6a26-8fb9-4849-996d-2d240b3eda97.jpg", + "SR": "https://imgsli.com/i/aea9dd40-c261-41d4-93d0-bea5f702700b.jpg" + }, + { + "type": "paired", + "caption": "Fear Factor Phony!", + "LR": "https://imgsli.com/i/165ae236-385e-4519-b062-d7e8ec21d797.jpg", + "SR": "https://imgsli.com/i/fcbae9aa-dd0d-4c50-9071-86c8299f5b25.jpg" + }, + { + "type": "paired", + "caption": "Once There Were Greenfields", + "LR": "https://imgsli.com/i/91270773-c8e9-4ea3-a679-ce1acde79b60.jpg", + "SR": "https://imgsli.com/i/1498de96-c924-4fba-b7cb-3b128e765d05.jpg" + } + ] +} \ No newline at end of file diff --git a/data/models/2x-DigitalPokemon-s.json b/data/models/2x-DigitalPokemon-s.json new file mode 100644 index 0000000..267e08e --- /dev/null +++ b/data/models/2x-DigitalPokemon-s.json @@ -0,0 +1,59 @@ +{ + "name": "Digital Pokémon-Small", + "author": "pokepress", + "license": "MIT", + "tags": [ + "anime", + "cartoon", + "general-upscaler" + ], + "description": "This model is designed to upscale the standard definition digital era of the Pokémon anime, which runs from late season 5 (Master Quest) to early season 12 (Galactic Battles). During this time, the show was animated digitally in a 4:3 ratio. This process was also used for Mewtwo Returns, most of Pokémon Chronicles, and the Mystery Dungeon specials.\n\nAdvice/Known Limitations:\n* I recommend using QTGMC on a preset of \"Slow\" or slower for deinterlacing. While the show is primarily animated at 12/24 fps, some elements like backgrounds are animated at a full 60i.\n* The model is not great at handling fonts, particularly the italicized text in the episode credits. 
This is despite including font images in the training data.", + "date": "2025-01-05", + "architecture": "compact", + "size": null, + "scale": 2, + "inputChannels": 3, + "outputChannels": 3, + "resources": [ + { + "platform": "pytorch", + "type": "pth", + "size": 2418324, + "sha256": "bfa3409a2a2306314645c65f6660cff2077bde1ba9dbbbf08248ecbace7ade3a", + "urls": [ + "https://www.mediafire.com/file/37n5iwfkrpqd3ef/digital_pokemon_compact.pth/file" + ] + } + ], + "trainingIterations": 230000, + "trainingHRSize": 64, + "trainingOTF": false, + "dataset": "Screenshots from seasons 6-11 of the English Pokémon dub, plus some manually created images for fonts.", + "datasetSize": 74, + "images": [ + { + "type": "paired", + "caption": "A Bite to Remember", + "LR": "https://imgsli.com/i/db8243fa-875a-410e-a3cd-fafbb3af9cb1.jpg", + "SR": "https://imgsli.com/i/08e7cfd5-a764-4db4-9184-a9392504af3c.jpg" + }, + { + "type": "paired", + "caption": "Going, Going, Yawn Title Card", + "LR": "https://imgsli.com/i/d36cf8f0-7755-443e-b248-c06e2a7c9449.jpg", + "SR": "https://imgsli.com/i/bdd8af00-b6c0-4a53-8465-bfa82c5fe0c3.jpg" + }, + { + "type": "paired", + "caption": "Fear Factor Phony!", + "LR": "https://imgsli.com/i/2d6cacbe-91e9-4564-a197-9a86d9ed4c60.jpg", + "SR": "https://imgsli.com/i/e7623bdb-6aec-4b83-bb90-8e7b0a4a63fd.jpg" + }, + { + "type": "paired", + "caption": "Once There Were Greenfields", + "LR": "https://imgsli.com/i/5a326f65-f23f-4eee-9538-94eba40d0c0b.jpg", + "SR": "https://imgsli.com/i/93ca0d6e-28ac-4eef-9227-8e828b90a045.jpg" + } + ] +} \ No newline at end of file