diff -Nru gallery-dl-1.23.2/CHANGELOG.md gallery-dl-1.24.0/CHANGELOG.md --- gallery-dl-1.23.2/CHANGELOG.md 2022-10-01 11:22:01.000000000 +0000 +++ gallery-dl-1.24.0/CHANGELOG.md 2022-11-20 14:36:04.000000000 +0000 @@ -1,5 +1,121 @@ # Changelog +## 1.24.0 - 2022-11-20 +### Additions +- [exhentai] add metadata to search results ([#3181](https://github.com/mikf/gallery-dl/issues/3181)) +- [gelbooru_v02] implement `notes` extraction +- [instagram] add `guide` extractor ([#3192](https://github.com/mikf/gallery-dl/issues/3192)) +- [lolisafe] add support for xbunkr ([#3153](https://github.com/mikf/gallery-dl/issues/3153), [#3156](https://github.com/mikf/gallery-dl/issues/3156)) +- [mastodon] add `instance_remote` metadata field ([#3119](https://github.com/mikf/gallery-dl/issues/3119)) +- [nitter] add extractors for Nitter instances ([#2415](https://github.com/mikf/gallery-dl/issues/2415), [#2696](https://github.com/mikf/gallery-dl/issues/2696)) +- [pixiv] add support for new daily AI rankings category ([#3214](https://github.com/mikf/gallery-dl/issues/3214), [#3221](https://github.com/mikf/gallery-dl/issues/3221)) +- [twitter] add `avatar` and `background` extractors ([#349](https://github.com/mikf/gallery-dl/issues/349), [#3023](https://github.com/mikf/gallery-dl/issues/3023)) +- [uploadir] add support for `uploadir.com` ([#3162](https://github.com/mikf/gallery-dl/issues/3162)) +- [wallhaven] add `user` extractor ([#3212](https://github.com/mikf/gallery-dl/issues/3212), [#3213](https://github.com/mikf/gallery-dl/issues/3213), [#3226](https://github.com/mikf/gallery-dl/issues/3226)) +- [downloader:http] add `chunk-size` option ([#3143](https://github.com/mikf/gallery-dl/issues/3143)) +- [downloader:http] add file signature check for `.mp4` files +- [downloader:http] add file signature check and MIME type for `.avif` files +- [postprocessor] implement `post-after` event ([#3117](https://github.com/mikf/gallery-dl/issues/3117)) +- [postprocessor:metadata] implement `"mode": "jsonl"` +- [postprocessor:metadata] add `open`, `encoding`, and `private` options +- add `--chunk-size` command-line option ([#3143](https://github.com/mikf/gallery-dl/issues/3143)) +- add `--user-agent` command-line option +- implement `http-metadata` option +- implement `"user-agent": "browser"` ([#2636](https://github.com/mikf/gallery-dl/issues/2636)) +### Changes +- [deviantart] restore cookies warning for mature scraps ([#3129](https://github.com/mikf/gallery-dl/issues/3129)) +- [instagram] use REST API for unauthenticated users by default +- [downloader:http] increase default `chunk-size` to 32768 bytes ([#3143](https://github.com/mikf/gallery-dl/issues/3143)) +- build Windows executables using py2exe's new `freeze()` API +- build executables on GitHub Actions with Python 3.11 +- reword error text for unsupported URLs +### Fixes +- [exhentai] fix pagination ([#3181](https://github.com/mikf/gallery-dl/issues/3181)) +- [khinsider] fix extraction ([#3215](https://github.com/mikf/gallery-dl/issues/3215), [#3219](https://github.com/mikf/gallery-dl/issues/3219)) +- [realbooru] fix download URLs ([#2530](https://github.com/mikf/gallery-dl/issues/2530)) +- [realbooru] fix `tags` extraction ([#2530](https://github.com/mikf/gallery-dl/issues/2530)) +- [tumblr] fall back to `gifv` when possible ([#3095](https://github.com/mikf/gallery-dl/issues/3095), [#3159](https://github.com/mikf/gallery-dl/issues/3159)) +- [twitter] fix login ([#3220](https://github.com/mikf/gallery-dl/issues/3220)) +- [twitter] update URL for syndication API 
([#3160](https://github.com/mikf/gallery-dl/issues/3160)) +- [weibo] send `Referer` headers ([#3188](https://github.com/mikf/gallery-dl/issues/3188)) +- [ytdl] update `parse_bytes` location ([#3256](https://github.com/mikf/gallery-dl/issues/3256)) +### Improvements +- [imxto] extract additional metadata ([#3118](https://github.com/mikf/gallery-dl/issues/3118), [#3175](https://github.com/mikf/gallery-dl/issues/3175)) +- [instagram] allow downloading avatars for private profiles ([#3255](https://github.com/mikf/gallery-dl/issues/3255)) +- [pixiv] raise error for invalid search/ranking parameters ([#3214](https://github.com/mikf/gallery-dl/issues/3214)) +- [twitter] update `bookmarks` pagination ([#3172](https://github.com/mikf/gallery-dl/issues/3172)) +- [downloader:http] refactor file signature checks +- [downloader:http] improve `-r/--limit-rate` accuracy ([#3143](https://github.com/mikf/gallery-dl/issues/3143)) +- add loaded config files to debug output +- improve `-K` output for lists +### Removals +- [instagram] remove login support ([#3139](https://github.com/mikf/gallery-dl/issues/3139), [#3141](https://github.com/mikf/gallery-dl/issues/3141), [#3191](https://github.com/mikf/gallery-dl/issues/3191)) +- [instagram] remove `channel` extractor +- [ngomik] remove module + +## 1.23.5 - 2022-10-30 +### Fixes +- [instagram] fix AttributeError on user stories extraction ([#3123](https://github.com/mikf/gallery-dl/issues/3123)) + +## 1.23.4 - 2022-10-29 +### Additions +- [aibooru] add support for aibooru.online ([#3075](https://github.com/mikf/gallery-dl/issues/3075)) +- [instagram] add 'avatar' extractor ([#929](https://github.com/mikf/gallery-dl/issues/929), [#1097](https://github.com/mikf/gallery-dl/issues/1097), [#2992](https://github.com/mikf/gallery-dl/issues/2992)) +- [instagram] support 'instagram.com/s/' highlight URLs ([#3076](https://github.com/mikf/gallery-dl/issues/3076)) +- [instagram] extract 'coauthors' metadata ([#3107](https://github.com/mikf/gallery-dl/issues/3107)) +- [mangasee] add support for 'mangalife' ([#3086](https://github.com/mikf/gallery-dl/issues/3086)) +- [mastodon] add 'bookmark' extractor ([#3109](https://github.com/mikf/gallery-dl/issues/3109)) +- [mastodon] support cross-instance user references and '/web/' URLs ([#3109](https://github.com/mikf/gallery-dl/issues/3109)) +- [moebooru] implement 'notes' extraction ([#3094](https://github.com/mikf/gallery-dl/issues/3094)) +- [pixiv] extend 'metadata' option ([#3057](https://github.com/mikf/gallery-dl/issues/3057)) +- [reactor] match 'best', 'new', 'all' URLs ([#3073](https://github.com/mikf/gallery-dl/issues/3073)) +- [smugloli] add 'smugloli' extractors ([#3060](https://github.com/mikf/gallery-dl/issues/3060)) +- [tumblr] add 'fallback-delay' and 'fallback-retries' options ([#2957](https://github.com/mikf/gallery-dl/issues/2957)) +- [vichan] add generic extractors for vichan imageboards +### Fixes +- [bcy] fix extraction ([#3103](https://github.com/mikf/gallery-dl/issues/3103)) +- [gelbooru] support alternate parameter order in post URLs ([#2821](https://github.com/mikf/gallery-dl/issues/2821)) +- [hentai2read] support minor versions in chapter URLs ([#3089](https://github.com/mikf/gallery-dl/issues/3089)) +- [hentaihere] support minor versions in chapter URLs +- [kemonoparty] fix 'dms' extraction ([#3106](https://github.com/mikf/gallery-dl/issues/3106)) +- [kemonoparty] update pagination offset +- [manganelo] update domain to 'chapmanganato.com' ([#3097](https://github.com/mikf/gallery-dl/issues/3097)) +- 
[pixiv] use 'exact_match_for_tags' as default search mode ([#3092](https://github.com/mikf/gallery-dl/issues/3092)) +- [redgifs] fix 'token' extraction ([#3080](https://github.com/mikf/gallery-dl/issues/3080), [#3081](https://github.com/mikf/gallery-dl/issues/3081)) +- [skeb] fix extraction ([#3112](https://github.com/mikf/gallery-dl/issues/3112)) +- improve compatibility of DownloadArchive ([#3078](https://github.com/mikf/gallery-dl/issues/3078)) + +## 1.23.3 - 2022-10-15 +### Additions +- [2chen] Add `2chen.moe` extractor ([#2707](https://github.com/mikf/gallery-dl/issues/2707)) +- [8chan] add `thread` and `board` extractors ([#2938](https://github.com/mikf/gallery-dl/issues/2938)) +- [deviantart] add `group` option ([#3018](https://github.com/mikf/gallery-dl/issues/3018)) +- [fanbox] add `content` metadata field ([#3020](https://github.com/mikf/gallery-dl/issues/3020)) +- [instagram] restore `cursor` functionality ([#2991](https://github.com/mikf/gallery-dl/issues/2991)) +- [instagram] restore warnings for private profiles ([#3004](https://github.com/mikf/gallery-dl/issues/3004), [#3045](https://github.com/mikf/gallery-dl/issues/3045)) +- [nana] add `nana` extractors ([#2967](https://github.com/mikf/gallery-dl/issues/2967)) +- [nijie] add `feed` and `followed` extractors ([#3048](https://github.com/mikf/gallery-dl/issues/3048)) +- [tumblr] support `https://www.tumblr.com/BLOGNAME` URLs ([#3034](https://github.com/mikf/gallery-dl/issues/3034)) +- [tumblr] add `offset` option +- [vk] add `tagged` extractor ([#2997](https://github.com/mikf/gallery-dl/issues/2997)) +- add `path-extended` option ([#3021](https://github.com/mikf/gallery-dl/issues/3021)) +- emit debug logging messages before calling time.sleep() ([#2982](https://github.com/mikf/gallery-dl/issues/2982)) +### Changes +- [postprocessor:metadata] assume `"mode": "custom"` when `format` is given +### Fixes +- [artstation] skip missing projects ([#3016](https://github.com/mikf/gallery-dl/issues/3016)) +- [danbooru] fix ugoira metadata extraction ([#3056](https://github.com/mikf/gallery-dl/issues/3056)) +- [deviantart] fix `deviation` extraction ([#2981](https://github.com/mikf/gallery-dl/issues/2981)) +- [hitomi] fall back to `webp` when selected format is not available ([#3030](https://github.com/mikf/gallery-dl/issues/3030)) +- [imagefap] fix and improve folder extraction and gallery pagination ([#3013](https://github.com/mikf/gallery-dl/issues/3013)) +- [instagram] fix login ([#3011](https://github.com/mikf/gallery-dl/issues/3011), [#3015](https://github.com/mikf/gallery-dl/issues/3015)) +- [nozomi] fix extraction ([#3051](https://github.com/mikf/gallery-dl/issues/3051)) +- [redgifs] fix extraction ([#3037](https://github.com/mikf/gallery-dl/issues/3037)) +- [tumblr] sleep between fallback retries ([#2957](https://github.com/mikf/gallery-dl/issues/2957)) +- [vk] unescape error messages +- fix duplicated metadata bug with `-j` ([#3033](https://github.com/mikf/gallery-dl/issues/3033)) +- fix bug when processing input file comments ([#2808](https://github.com/mikf/gallery-dl/issues/2808)) + ## 1.23.2 - 2022-10-01 ### Additions - [artstation] support search filters ([#2970](https://github.com/mikf/gallery-dl/issues/2970)) diff -Nru gallery-dl-1.23.2/data/completion/_gallery-dl gallery-dl-1.24.0/data/completion/_gallery-dl --- gallery-dl-1.23.2/data/completion/_gallery-dl 2022-07-10 11:30:26.000000000 +0000 +++ gallery-dl-1.24.0/data/completion/_gallery-dl 2022-11-11 19:20:08.000000000 +0000 @@ -13,6 +13,7 @@ {-f,--filename}'[Filename 
format string for downloaded files ("/O" for "original" filenames)]':'' \ --proxy'[Use the specified proxy]':'' \ --source-address'[Client-side IP address to bind to]':'' \ +--user-agent'[User-Agent request header]':'' \ --clear-cache'[Delete cached login sessions, cookies, etc. for MODULE (ALL to delete everything)]':'' \ --cookies'[File to load additional cookies from]':'':_files \ --cookies-from-browser'[Name of the browser to load cookies from, with optional keyring name prefixed with "+" and profile prefixed with ":"]':'' \ @@ -37,6 +38,7 @@ --sleep-extractor'[Number of seconds to wait before starting data extraction for an input URL]':'' \ --filesize-min'[Do not download files smaller than SIZE (e.g. 500k or 2.5M)]':'' \ --filesize-max'[Do not download files larger than SIZE (e.g. 500k or 2.5M)]':'' \ +--chunk-size'[Size of in-memory data chunks (default: 32k)]':'' \ --no-part'[Do not use .part files]' \ --no-skip'[Do not skip downloads; overwrite existing files]' \ --no-mtime'[Do not set file modification times according to Last-Modified HTTP response headers]' \ diff -Nru gallery-dl-1.23.2/data/completion/gallery-dl gallery-dl-1.24.0/data/completion/gallery-dl --- gallery-dl-1.23.2/data/completion/gallery-dl 2022-07-10 11:30:26.000000000 +0000 +++ gallery-dl-1.24.0/data/completion/gallery-dl 2022-11-11 19:20:08.000000000 +0000 @@ -10,7 +10,7 @@ elif [[ "${prev}" =~ ^()$ ]]; then COMPREPLY=( $(compgen -d -- "${cur}") ) else - COMPREPLY=( $(compgen -W "--help --version --input-file --destination --directory --filename --proxy --source-address --clear-cache --cookies --cookies-from-browser --quiet --verbose --get-urls --resolve-urls --dump-json --simulate --extractor-info --list-keywords --list-modules --list-extractors --write-log --write-unsupported --write-pages --limit-rate --retries --http-timeout --sleep --sleep-request --sleep-extractor --filesize-min --filesize-max --no-part --no-skip --no-mtime --no-download --no-postprocessors --no-check-certificate --config --config-yaml --option --ignore-config --username --password --netrc --download-archive --abort --terminate --range --chapter-range --filter --chapter-filter --zip --ugoira-conv --ugoira-conv-lossless --ugoira-conv-copy --write-metadata --write-info-json --write-infojson --write-tags --mtime-from-date --exec --exec-after --postprocessor" -- "${cur}") ) + COMPREPLY=( $(compgen -W "--help --version --input-file --destination --directory --filename --proxy --source-address --user-agent --clear-cache --cookies --cookies-from-browser --quiet --verbose --get-urls --resolve-urls --dump-json --simulate --extractor-info --list-keywords --list-modules --list-extractors --write-log --write-unsupported --write-pages --limit-rate --retries --http-timeout --sleep --sleep-request --sleep-extractor --filesize-min --filesize-max --chunk-size --no-part --no-skip --no-mtime --no-download --no-postprocessors --no-check-certificate --config --config-yaml --option --ignore-config --username --password --netrc --download-archive --abort --terminate --range --chapter-range --filter --chapter-filter --zip --ugoira-conv --ugoira-conv-lossless --ugoira-conv-copy --write-metadata --write-info-json --write-infojson --write-tags --mtime-from-date --exec --exec-after --postprocessor" -- "${cur}") ) fi } diff -Nru gallery-dl-1.23.2/data/completion/gallery-dl.fish gallery-dl-1.24.0/data/completion/gallery-dl.fish --- gallery-dl-1.23.2/data/completion/gallery-dl.fish 2022-07-10 11:30:26.000000000 +0000 +++ 
gallery-dl-1.24.0/data/completion/gallery-dl.fish 2022-11-11 19:20:08.000000000 +0000 @@ -7,6 +7,7 @@ complete -c gallery-dl -x -s 'f' -l 'filename' -d 'Filename format string for downloaded files ("/O" for "original" filenames)' complete -c gallery-dl -x -l 'proxy' -d 'Use the specified proxy' complete -c gallery-dl -x -l 'source-address' -d 'Client-side IP address to bind to' +complete -c gallery-dl -x -l 'user-agent' -d 'User-Agent request header' complete -c gallery-dl -x -l 'clear-cache' -d 'Delete cached login sessions, cookies, etc. for MODULE (ALL to delete everything)' complete -c gallery-dl -r -F -l 'cookies' -d 'File to load additional cookies from' complete -c gallery-dl -x -l 'cookies-from-browser' -d 'Name of the browser to load cookies from, with optional keyring name prefixed with "+" and profile prefixed with ":"' @@ -31,6 +32,7 @@ complete -c gallery-dl -x -l 'sleep-extractor' -d 'Number of seconds to wait before starting data extraction for an input URL' complete -c gallery-dl -x -l 'filesize-min' -d 'Do not download files smaller than SIZE (e.g. 500k or 2.5M)' complete -c gallery-dl -x -l 'filesize-max' -d 'Do not download files larger than SIZE (e.g. 500k or 2.5M)' +complete -c gallery-dl -x -l 'chunk-size' -d 'Size of in-memory data chunks (default: 32k)' complete -c gallery-dl -l 'no-part' -d 'Do not use .part files' complete -c gallery-dl -l 'no-skip' -d 'Do not skip downloads; overwrite existing files' complete -c gallery-dl -l 'no-mtime' -d 'Do not set file modification times according to Last-Modified HTTP response headers' diff -Nru gallery-dl-1.23.2/data/man/gallery-dl.1 gallery-dl-1.24.0/data/man/gallery-dl.1 --- gallery-dl-1.23.2/data/man/gallery-dl.1 2022-10-01 11:22:01.000000000 +0000 +++ gallery-dl-1.24.0/data/man/gallery-dl.1 2022-11-20 14:36:04.000000000 +0000 @@ -1,4 +1,4 @@ -.TH "GALLERY-DL" "1" "2022-10-01" "1.23.2" "gallery-dl Manual" +.TH "GALLERY-DL" "1" "2022-11-20" "1.24.0" "gallery-dl Manual" .\" disable hyphenation .nh @@ -41,6 +41,9 @@ .B "\-\-source\-address" \f[I]IP\f[] Client-side IP address to bind to .TP +.B "\-\-user\-agent" \f[I]UA\f[] +User-Agent request header +.TP .B "\-\-clear\-cache" \f[I]MODULE\f[] Delete cached login sessions, cookies, etc. for MODULE (ALL to delete everything) .TP @@ -113,6 +116,9 @@ .B "\-\-filesize\-max" \f[I]SIZE\f[] Do not download files larger than SIZE (e.g. 500k or 2.5M) .TP +.B "\-\-chunk\-size" \f[I]SIZE\f[] +Size of in-memory data chunks (default: 32k) +.TP .B "\-\-no\-part" Do not use .part files .TP diff -Nru gallery-dl-1.23.2/data/man/gallery-dl.conf.5 gallery-dl-1.24.0/data/man/gallery-dl.conf.5 --- gallery-dl-1.23.2/data/man/gallery-dl.conf.5 2022-10-01 11:22:01.000000000 +0000 +++ gallery-dl-1.24.0/data/man/gallery-dl.conf.5 2022-11-20 14:36:04.000000000 +0000 @@ -1,4 +1,4 @@ -.TH "GALLERY-DL.CONF" "5" "2022-10-01" "1.23.2" "gallery-dl Manual" +.TH "GALLERY-DL.CONF" "5" "2022-11-20" "1.24.0" "gallery-dl Manual" .\" disable hyphenation .nh .\" disable justification (adjust text to left margin only) @@ -310,6 +310,18 @@ * \f[I]"windows"\f[]: \f[I]". "\f[] +.SS extractor.*.path-extended +.IP "Type:" 6 +\f[I]bool\f[] + +.IP "Default:" 9 +\f[I]true\f[] + +.IP "Description:" 4 +On Windows, use \f[I]extended-length paths\f[] +prefixed with \f[I]\\\\?\\\f[] to work around the 260 characters path length limit. 
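As a point of reference, this option goes into the extractor block of a configuration file like any other path setting; a minimal sketch (the value shown is illustrative and is already the default, and the option only has an effect on Windows):

    {
        "extractor": {
            "path-extended": true
        }
    }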
+ + .SS extractor.*.extension-map .IP "Type:" 6 \f[I]object\f[] @@ -437,8 +449,6 @@ .br * \f[I]inkbunny\f[] .br -* \f[I]instagram\f[] -.br * \f[I]kemonoparty\f[] .br * \f[I]mangadex\f[] @@ -603,6 +613,9 @@ .IP "Description:" 4 User-Agent header value to be used for HTTP requests. +Setting this value to \f[I]"browser"\f[] will try to automatically detect +and use the User-Agent used by the system's default browser. + Note: This option has no effect on pixiv extractors, as these need specific values to function correctly. @@ -612,7 +625,10 @@ \f[I]string\f[] .IP "Default:" 9 -\f[I]"firefox"\f[] for \f[I]patreon\f[], \f[I]null\f[] everywhere else +.br +* \f[I]"firefox"\f[] for \f[I]patreon\f[], \f[I]mangapark\f[], and \f[I]mangasee\f[] +.br +* \f[I]null\f[] everywhere else .IP "Example:" 4 .br @@ -684,6 +700,23 @@ to access the current file's filename as \f[I]"[gdl_path.filename}"\f[]. +.SS extractor.*.http-metadata +.IP "Type:" 6 +\f[I]string\f[] + +.IP "Default:" 9 +\f[I]null\f[] + +.IP "Description:" 4 +Insert an \f[I]object\f[] containing a file's HTTP headers and +\f[I]filename\f[], \f[I]extension\f[], and \f[I]date\f[] parsed from them +into metadata dictionaries as the given name. + +For example, setting this option to \f[I]"gdl_http"\f[] would make it possible +to access the current file's \f[I]Last-Modified\f[] header as \f[I]"{gdl_http[Last-Modified]}"\f[] +and its parsed form as \f[I]"{gdl_http[date]}"\f[]. + + .SS extractor.*.category-transfer .IP "Type:" 6 \f[I]bool\f[] @@ -1211,6 +1244,18 @@ Use with caution. +.SS extractor.deviantart.group +.IP "Type:" 6 +\f[I]bool\f[] + +.IP "Default:" 9 +\f[I]true\f[] + +.IP "Description:" 4 +Check whether the profile name in a given URL +belongs to a group or a regular user. + + .SS extractor.deviantart.include .IP "Type:" 6 \f[I]string\f[] or \f[I]list\f[] of \f[I]strings\f[] @@ -1694,17 +1739,15 @@ \f[I]string\f[] .IP "Default:" 9 -\f[I]"auto"\f[] +\f[I]"rest"\f[] .IP "Description:" 4 Selects which API endpoints to use. .br -* \f[I]"rest"\f[]: REST API - higher-resolution media, only usable when logged in -.br -* \f[I]"graphql"\f[]: GraphQL API - lower-resolution media, partially accessible when not logged in +* \f[I]"rest"\f[]: REST API - higher-resolution media .br -* \f[I]"auto"\f[]: Use REST API when logged in, GraphQL API otherwise +* \f[I]"graphql"\f[]: GraphQL API - lower-resolution media .SS extractor.instagram.include @@ -1722,8 +1765,12 @@ when processing a user profile. Possible values are -\f[I]"posts"\f[], \f[I]"reels"\f[], \f[I]"channel"\f[], \f[I]"tagged"\f[], -\f[I]"stories"\f[], \f[I]"highlights"\f[]. +\f[I]"posts"\f[], +\f[I]"reels"\f[], +\f[I]"tagged"\f[], +\f[I]"stories"\f[], +\f[I]"highlights"\f[], +\f[I]"avatar"\f[]. You can use \f[I]"all"\f[] instead of listing all values separately. @@ -1974,6 +2021,18 @@ Also emit metadata for text-only posts without media content. +.SS extractor.nana.favkey +.IP "Type:" 6 +\f[I]string\f[] + +.IP "Default:" 9 +\f[I]null\f[] + +.IP "Description:" 4 +Your \f[I]Nana Favorite Key\f[], +used to access your favorite archives. + + .SS extractor.newgrounds.flash .IP "Type:" 6 \f[I]bool\f[] @@ -2214,7 +2273,7 @@ It is possible to use \f[I]"all"\f[] instead of listing all values separately. -.SS extractor.pixiv.artworks.metadata +.SS extractor.pixiv.metadata .IP "Type:" 6 \f[I]bool\f[] @@ -2610,6 +2669,19 @@ Search posts for inline images and videos. 
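To tie the new options documented above together, a configuration sketch combining them might look as follows (the "gdl_http" name and the filename format string are illustrative choices, not defaults):

    {
        "extractor": {
            "user-agent": "browser",
            "http-metadata": "gdl_http",
            "filename": "{gdl_http[date]} {filename}.{extension}"
        }
    }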
+.SS extractor.tumblr.offset
+.IP "Type:" 6
+\f[I]integer\f[]
+
+.IP "Default:" 9
+\f[I]0\f[]
+
+.IP "Description:" 4
+Custom \f[I]offset\f[] starting value when paginating over blog posts.
+
+Allows skipping over posts without having to waste API calls.
+
+
 .SS extractor.tumblr.original
 .IP "Type:" 6
 \f[I]bool\f[]
@@ -2678,6 +2750,29 @@
 You can use \f[I]"all"\f[] instead of listing all types separately.
 
 
+.SS extractor.tumblr.fallback-delay
+.IP "Type:" 6
+\f[I]float\f[]
+
+.IP "Default:" 9
+\f[I]120.0\f[]
+
+.IP "Description:" 4
+Number of seconds to wait between retries
+for fetching full-resolution images.
+
+
+.SS extractor.tumblr.fallback-retries
+.IP "Type:" 6
+\f[I]integer\f[]
+
+.IP "Default:" 9
+\f[I]2\f[]
+
+.IP "Description:" 4
+Number of retries for fetching full-resolution images.
+
+
 .SS extractor.twibooru.api-key
 .IP "Type:" 6
 \f[I]string\f[]
@@ -3028,6 +3123,32 @@
 See https://wallhaven.cc/help/api for more information.
 
 
+.SS extractor.wallhaven.include
+.IP "Type:" 6
+.br
+* \f[I]string\f[]
+.br
+* \f[I]list\f[] of \f[I]strings\f[]
+
+.IP "Default:" 9
+\f[I]"uploads"\f[]
+
+.IP "Example:" 4
+.br
+* "uploads,collections"
+.br
+* ["uploads", "collections"]
+
+.IP "Description:" 4
+A (comma-separated) list of subcategories to include
+when processing a user profile.
+
+Possible values are
+\f[I]"uploads"\f[], \f[I]"collections"\f[].
+
+It is possible to use \f[I]"all"\f[] instead of listing all values separately.
+
+
 .SS extractor.wallhaven.metadata
 .IP "Type:" 6
 \f[I]bool\f[]
@@ -3336,7 +3457,7 @@
 Any file smaller/larger than this limit will not be downloaded.
 
 Possible values are valid integer or floating-point numbers
-optionally followed by one of \f[I]k\f[], \f[I]m\f[], \f[I]g\f[], \f[I]t\f[] or \f[I]p\f[].
+optionally followed by one of \f[I]k\f[], \f[I]m\f[], \f[I]g\f[], \f[I]t\f[], or \f[I]p\f[].
 These suffixes are case-insensitive.
@@ -3414,7 +3535,7 @@
 Maximum download rate in bytes per second.
 
 Possible values are valid integer or floating-point numbers
-optionally followed by one of \f[I]k\f[], \f[I]m\f[], \f[I]g\f[], \f[I]t\f[] or \f[I]p\f[].
+optionally followed by one of \f[I]k\f[], \f[I]m\f[], \f[I]g\f[], \f[I]t\f[], or \f[I]p\f[].
 These suffixes are case-insensitive.
@@ -3474,9 +3595,31 @@
 \f[I]true\f[]
 
 .IP "Description:" 4
-Check the file headers of \f[I]jpg\f[], \f[I]png\f[], and \f[I]gif\f[] files
+Check file headers of downloaded files
 and adjust their filename extensions if they do not match.
 
+For example, this will change the filename extension (\f[I]{extension}\f[])
+of a file called \f[I]example.png\f[] from \f[I]png\f[] to \f[I]jpg\f[] when said file
+contains JPEG/JFIF data.
+
+
+.SS downloader.http.chunk-size
+.IP "Type:" 6
+\f[I]integer\f[] or \f[I]string\f[]
+
+.IP "Default:" 9
+\f[I]32768\f[]
+
+.IP "Example:" 4
+"50k", "0.8M"
+
+.IP "Description:" 4
+Number of bytes per downloaded chunk.
+
+Possible values are integer numbers
+optionally followed by one of \f[I]k\f[], \f[I]m\f[], \f[I]g\f[], \f[I]t\f[], or \f[I]p\f[].
+These suffixes are case-insensitive.
+
 
 .SS downloader.http.headers
 .IP "Type:" 6
@@ -3928,6 +4071,9 @@
 * \f[I]"json"\f[]: write metadata using \f[I]json.dump()
 \f[]
 .br
+* \f[I]"jsonl"\f[]: write metadata in \f[I]JSON Lines
+\f[] format
+.br
 * \f[I]"tags"\f[]: write \f[I]tags\f[] separated by newlines
 .br
 * \f[I]"custom"\f[]: write the result of applying \f[I]metadata.content-format\f[]
@@ -4031,6 +4177,8 @@
 \f[I]post\f[]
 When starting to download all files of a post,
 e.g. a Tweet on Twitter or a post on Patreon.
+\f[I]post-after\f[]
+After downloading all files of a post


.SS metadata.fields
@@ -4082,6 +4230,48 @@
 Note: Only applies for \f[I]"mode": "custom"\f[].
 
 
+.SS metadata.open
+.IP "Type:" 6
+\f[I]string\f[]
+
+.IP "Default:" 9
+\f[I]"w"\f[]
+
+.IP "Description:" 4
+The \f[I]mode\f[] in which metadata files get opened.
+
+For example,
+use \f[I]"a"\f[] to append to a file's content
+or \f[I]"w"\f[] to truncate it.
+
+See the \f[I]mode\f[] parameter of \f[I]open()\f[] for further details.
+
+
+.SS metadata.private
+.IP "Type:" 6
+\f[I]bool\f[]
+
+.IP "Default:" 9
+\f[I]false\f[]
+
+.IP "Description:" 4
+Include private fields,
+i.e. fields whose name starts with an underscore.
+
+
+.SS metadata.encoding
+.IP "Type:" 6
+\f[I]string\f[]
+
+.IP "Default:" 9
+\f[I]"utf-8"\f[]
+
+.IP "Description:" 4
+Name of the encoding used to encode a file's content.
+
+See the \f[I]encoding\f[] parameter of \f[I]open()\f[] for further details.
+
+
 .SS metadata.archive
 .IP "Type:" 6
 \f[I]Path\f[]
diff -Nru gallery-dl-1.23.2/debian/changelog gallery-dl-1.24.0/debian/changelog
--- gallery-dl-1.23.2/debian/changelog	2022-10-06 07:35:41.000000000 +0000
+++ gallery-dl-1.24.0/debian/changelog	2022-11-23 02:56:11.000000000 +0000
@@ -1,12 +1,30 @@
-gallery-dl (1.23.2-1~bpo20.04.1) focal-backports; urgency=medium
+gallery-dl (1.24.0-1~bpo20.04.1) focal-backports; urgency=medium
 
  * No-change backport to focal.
 
- -- Unit 193  Thu, 06 Oct 2022 03:35:41 -0400
+ -- Unit 193  Tue, 22 Nov 2022 21:56:11 -0500
+
+gallery-dl (1.24.0-1) unstable; urgency=medium
+
+  * New upstream version 1.24.0.
+
+ -- Unit 193  Tue, 22 Nov 2022 04:35:11 -0500
+
+gallery-dl (1.23.5-1) unstable; urgency=medium
+
+  * New upstream version 1.23.5.
+
+ -- Unit 193  Tue, 01 Nov 2022 21:33:44 -0400
+
+gallery-dl (1.23.3-1) unstable; urgency=medium
+
+  * New upstream version 1.23.3.
+
+ -- Unit 193  Mon, 17 Oct 2022 03:46:23 -0400
 
 gallery-dl (1.23.2-1) unstable; urgency=medium
 
- * New upstream version 1.23.2
+ * New upstream version 1.23.2.
-- Unit 193 Mon, 03 Oct 2022 04:10:00 -0400 diff -Nru gallery-dl-1.23.2/docs/gallery-dl.conf gallery-dl-1.24.0/docs/gallery-dl.conf --- gallery-dl-1.23.2/docs/gallery-dl.conf 2022-09-30 17:35:45.000000000 +0000 +++ gallery-dl-1.24.0/docs/gallery-dl.conf 2022-11-17 16:15:08.000000000 +0000 @@ -24,6 +24,8 @@ "path-replace": "_", "path-remove": "\\u0000-\\u001f\\u007f", "path-strip": "auto", + "path-extended": true, + "extension-map": { "jpeg": "jpg", "jpe" : "jpg", @@ -71,10 +73,13 @@ { "client-id": null, "client-secret": null, + "auto-watch": false, + "auto-unwatch": false, "comments": false, "extra": false, "flat": true, "folders": false, + "group": true, "include": "gallery", "journals": "html", "mature": true, @@ -154,9 +159,8 @@ }, "instagram": { - "username": null, - "password": null, - "api": "auto", + "api": "rest", + "cookies": null, "include": "posts", "sleep-request": [6.0, 12.0], "videos": true @@ -189,6 +193,10 @@ "format": "original", "include": "art" }, + "nana": + { + "favkey": null + }, "nijie": { "username": null, @@ -221,6 +229,7 @@ { "refresh-token": null, "include": "artworks", + "metadata": false, "tags": "japanese", "ugoira": true }, @@ -288,6 +297,7 @@ "external": false, "inline": true, "posts": "all", + "offset": 0, "original": true, "reblogs": true }, @@ -319,7 +329,8 @@ "wallhaven": { "api-key": null, - "metadata": false + "metadata": false, + "include": "uploads" }, "weasyl": { @@ -370,6 +381,7 @@ "http": { "adjust-extensions": true, + "chunk-size": 32768, "headers": null }, diff -Nru gallery-dl-1.23.2/docs/gallery-dl-example.conf gallery-dl-1.24.0/docs/gallery-dl-example.conf --- gallery-dl-1.23.2/docs/gallery-dl-example.conf 2022-09-30 14:46:45.000000000 +0000 +++ gallery-dl-1.24.0/docs/gallery-dl-example.conf 2022-11-10 12:38:30.000000000 +0000 @@ -210,6 +210,19 @@ "text-tweets": true }, + "ytdl": + { + "#": "enable 'ytdl' extractor", + "#": "i.e. 
invoke ytdl on all otherwise unsupported input URLs", + "enabled": true, + + "#": "use yt-dlp instead of youtube-dl", + "module": "yt_dlp", + + "#": "load ytdl options from config file", + "config-file": "~/yt-dlp.conf" + }, + "mastodon": { "#": "add 'tabletop.social' as recognized mastodon instance", diff -Nru gallery-dl-1.23.2/gallery_dl/config.py gallery-dl-1.24.0/gallery_dl/config.py --- gallery-dl-1.23.2/gallery_dl/config.py 2022-05-27 13:20:33.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/config.py 2022-11-18 12:33:19.000000000 +0000 @@ -21,6 +21,7 @@ # internals _config = {} +_files = [] if util.WINDOWS: _default_configs = [ @@ -61,8 +62,8 @@ else: parsefunc = json.load - for path in files or _default_configs: - path = util.expand_path(path) + for pathfmt in files or _default_configs: + path = util.expand_path(pathfmt) try: with open(path, encoding="utf-8") as file: confdict = parsefunc(file) @@ -79,6 +80,7 @@ _config.update(confdict) else: util.combine_dict(_config, confdict) + _files.append(pathfmt) def clear(): diff -Nru gallery-dl-1.23.2/gallery_dl/cookies.py gallery-dl-1.24.0/gallery_dl/cookies.py --- gallery-dl-1.23.2/gallery_dl/cookies.py 2022-06-11 13:30:11.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/cookies.py 2022-11-18 12:12:14.000000000 +0000 @@ -263,7 +263,7 @@ path = _find_most_recently_used_file(search_root, "Cookies") if path is None: - raise FileNotFoundError("Unable tp find {} cookies database in " + raise FileNotFoundError("Unable to find {} cookies database in " "'{}'".format(config["browser"], search_root)) logger.debug("Extracting cookies from %s", path) diff -Nru gallery-dl-1.23.2/gallery_dl/downloader/http.py gallery-dl-1.24.0/gallery_dl/downloader/http.py --- gallery-dl-1.23.2/gallery_dl/downloader/http.py 2022-09-19 20:10:20.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/downloader/http.py 2022-11-20 00:22:11.000000000 +0000 @@ -27,10 +27,11 @@ def __init__(self, job): DownloaderBase.__init__(self, job) extractor = job.extractor - self.chunk_size = 16384 self.downloading = False self.adjust_extension = self.config("adjust-extensions", True) + self.chunk_size = self.config("chunk-size", 32768) + self.metadata = extractor.config("http-metadata") self.progress = self.config("progress", 3.0) self.headers = self.config("headers") self.minsize = self.config("filesize-min") @@ -55,6 +56,13 @@ self.log.warning( "Invalid maximum file size (%r)", self.maxsize) self.maxsize = maxsize + if isinstance(self.chunk_size, str): + chunk_size = text.parse_bytes(self.chunk_size) + if not chunk_size: + self.log.warning( + "Invalid chunk size (%r)", self.chunk_size) + chunk_size = 32768 + self.chunk_size = chunk_size if self.rate: rate = text.parse_bytes(self.rate) if rate: @@ -83,11 +91,12 @@ tries = 0 msg = "" + metadata = self.metadata kwdict = pathfmt.kwdict adjust_extension = kwdict.get( "_http_adjust_extension", self.adjust_extension) - if self.part: + if self.part and not metadata: pathfmt.part_enable(self.partdir) while True: @@ -164,13 +173,6 @@ self.log.warning("Invalid response") return False - # set missing filename extension from MIME type - if not pathfmt.extension: - pathfmt.set_extension(self._find_extension(response)) - if pathfmt.exists(): - pathfmt.temppath = "" - return True - # check file size size = text.parse_int(size, None) if size is not None: @@ -185,11 +187,33 @@ size, self.maxsize) return False + build_path = False + + # set missing filename extension from MIME type + if not pathfmt.extension: + 
pathfmt.set_extension(self._find_extension(response)) + build_path = True + + # set metadata from HTTP headers + if metadata: + kwdict[metadata] = util.extract_headers(response) + build_path = True + + # build and check file path + if build_path: + pathfmt.build_path() + if pathfmt.exists(): + pathfmt.temppath = "" + return True + if self.part and metadata: + pathfmt.part_enable(self.partdir) + metadata = False + content = response.iter_content(self.chunk_size) # check filename extension against file header if adjust_extension and not offset and \ - pathfmt.extension in FILE_SIGNATURES: + pathfmt.extension in SIGNATURE_CHECKS: try: file_header = next( content if response.raw.chunked @@ -220,7 +244,7 @@ offset += len(file_header) elif offset: if adjust_extension and \ - pathfmt.extension in FILE_SIGNATURES: + pathfmt.extension in SIGNATURE_CHECKS: self._adjust_extension(pathfmt, fp.read(16)) fp.seek(offset) @@ -250,42 +274,38 @@ return True @staticmethod - def receive(fp, content, bytes_total, bytes_downloaded): + def receive(fp, content, bytes_total, bytes_start): write = fp.write for data in content: write(data) - def _receive_rate(self, fp, content, bytes_total, bytes_downloaded): + def _receive_rate(self, fp, content, bytes_total, bytes_start): rate = self.rate - progress = self.progress - bytes_start = bytes_downloaded write = fp.write - t1 = tstart = time.time() + progress = self.progress + + bytes_downloaded = 0 + time_start = time.time() for data in content: - write(data) + time_current = time.time() + time_elapsed = time_current - time_start + bytes_downloaded += len(data) - t2 = time.time() # current time - elapsed = t2 - t1 # elapsed time - num_bytes = len(data) + write(data) if progress is not None: - bytes_downloaded += num_bytes - tdiff = t2 - tstart - if tdiff >= progress: + if time_elapsed >= progress: self.out.progress( - bytes_total, bytes_downloaded, - int((bytes_downloaded - bytes_start) / tdiff), + bytes_total, + bytes_start + bytes_downloaded, + int(bytes_downloaded / time_elapsed), ) if rate: - expected = num_bytes / rate # expected elapsed time - if elapsed < expected: - # sleep if less time elapsed than expected - time.sleep(expected - elapsed) - t2 = time.time() - - t1 = t2 + time_expected = bytes_downloaded / rate + if time_expected > time_elapsed: + time.sleep(time_expected - time_elapsed) def _find_extension(self, response): """Get filename extension from MIME type""" @@ -308,11 +328,11 @@ @staticmethod def _adjust_extension(pathfmt, file_header): """Check filename extension against file header""" - sig = FILE_SIGNATURES[pathfmt.extension] - if not file_header.startswith(sig): - for ext, sig in FILE_SIGNATURES.items(): - if file_header.startswith(sig): + if not SIGNATURE_CHECKS[pathfmt.extension](file_header): + for ext, check in SIGNATURE_CHECKS.items(): + if check(file_header): pathfmt.set_extension(ext) + pathfmt.build_path() return True return False @@ -326,6 +346,7 @@ "image/x-bmp" : "bmp", "image/x-ms-bmp": "bmp", "image/webp" : "webp", + "image/avif" : "avif", "image/svg+xml" : "svg", "image/ico" : "ico", "image/icon" : "ico", @@ -362,27 +383,33 @@ } # https://en.wikipedia.org/wiki/List_of_file_signatures -FILE_SIGNATURES = { - "jpg" : b"\xFF\xD8\xFF", - "png" : b"\x89PNG\r\n\x1A\n", - "gif" : (b"GIF87a", b"GIF89a"), - "bmp" : b"BM", - "webp": b"RIFF", - "svg" : b"", "")[0] - title, _, boardname = title.rpartition(" - ") + title, _, boardname = text.extr( + page, "", "").rpartition(" - ") return { "server": self.server, "title": title, @@ -72,8 +72,8 @@ 
def posts(self, page):
         """Build a list of all post-objects"""
-        page = text.extract(
-            page, '<div class="thre', '<div style="clear:left;">')[0]
+        page = text.extr(
+            page, '<div class="thre', '<div style="clear:left;">')
         return [
             self.parse(post) for post in page.split('<table border=0>')
         ]
@@ -84,7 +84,7 @@
         data = self._extract_post(post)
         if data["name"]:
             data["name"] = data["name"].strip()
-        path = text.extract(post, '<a href="/', '"')[0]
+        path = text.extr(post, '<a href="/', '"')
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/2chen.py gallery-dl-1.24.0/gallery_dl/extractor/2chen.py
--- gallery-dl-1.23.2/gallery_dl/extractor/2chen.py	1970-01-01 00:00:00.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/2chen.py	2022-11-10 12:38:30.000000000 +0000
@@ -0,0 +1,90 @@
+# -*- coding: utf-8 -*-
+
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://2chen.moe/"""
+
+from .common import Extractor, Message
+from .. import text
+
+
+class _2chenThreadExtractor(Extractor):
+    """Extractor for 2chen threads"""
+    category = "2chen"
+    subcategory = "thread"
+    root = "https://2chen.moe"
+    directory_fmt = ("{category}", "{board}", "{thread} {title}")
+    filename_fmt = "{time} {filename}.{extension}"
+    archive_fmt = "{board}_{thread}_{hash}_{time}"
+    pattern = r"(?:https?://)?2chen\.moe/([^/?#]+)/(\d+)"
+    test = (
+        ("https://2chen.moe/tv/496715", {
+            "count": ">= 10",
+        }),
+    )
+
+    def __init__(self, match):
+        Extractor.__init__(self, match)
+        self.board, self.thread = match.groups()
+
+    def items(self):
+        url = "{}/{}/{}".format(self.root, self.board, self.thread)
+        page = self.request(url, encoding="utf-8").text
+        data = self.metadata(page)
+        yield Message.Directory, data
+        for post in self.posts(page):
+            if not post["url"]:
+                continue
+            post.update(data)
+            post["url"] = self.root + post["url"]
+            post["time"] = text.parse_int(post["date"].timestamp())
+            yield Message.Url, post["url"], text.nameext_from_url(
+                post["filename"], post)
+
+    def metadata(self, page):
+        board, pos = text.extract(page, 'class="board">/', '/<')
+        title = text.extract(page, "<h3>", "</h3>", pos)[0]
+        return {
+            "board" : board,
+            "thread": self.thread,
+            "title" : text.unescape(title),
+        }
+
+    def posts(self, page):
+        """Return iterable with relevant posts"""
+        return map(self.parse, text.extract_iter(
+            page, 'class="glass media', '</article>'))
+
+    def parse(self, post):
+        extr = text.extract_from(post)
+        return {
+            "name" : text.unescape(extr("<span>", "</span>")),
+            "date" : text.parse_datetime(
+                extr("<time", "<").partition(">")[2],
+                "%d %b %Y (%a) %H:%M:%S"
+            ),
+            "no"  : extr('href="#p', '"'),
+            "url" : extr('<a href="', '"'),
+            "filename": text.unescape(extr('download="', '"')),
+            "hash": extr('data-hash="', '"'),
+        }
+
+
+class _2chenBoardExtractor(Extractor):
+    """Extractor for 2chen boards"""
+    category = "2chen"
+    subcategory = "board"
+    root = "https://2chen.moe"
+    pattern = r"(?:https?://)?2chen\.moe/([^/?#]+)/?$"
+
+    def __init__(self, match):
+        Extractor.__init__(self, match)
+        self.board = match.group(1)
+
+    def items(self):
+        url = "{}/{}/catalog".format(self.root, self.board)
+        page = self.request(url).text
+        data = {"_extractor": _2chenThreadExtractor}
+        for thread in text.extract_iter(page, '<figure><a href="', '"'):
+            yield Message.Queue, self.root + thread, data
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/8chan.py gallery-dl-1.24.0/gallery_dl/extractor/8chan.py
--- gallery-dl-1.23.2/gallery_dl/extractor/8chan.py	1970-01-01 00:00:00.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/8chan.py	2022-11-10 12:38:30.000000000 +0000
@@ -0,0 +1,94 @@
+# -*- coding: utf-8 -*-
+
+# Copyright 2022 Mike Fährmann
+#
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License version 2 as
+# published by the Free Software Foundation.
+
+"""Extractors for https://8chan.moe/"""
+
+from .common import Extractor, Message
+from .. import text
+import itertools
+
+BASE_PATTERN = r"(?:https?://)?8chan\.(moe|se|cc)"
+
+
+class _8chanExtractor(Extractor):
+    """Base class for 8chan extractors"""
+    category = "8chan"
+    root = "https://8chan.moe"
+
+    def __init__(self, match):
+        self.root = "https://8chan." + match.group(1)
+        Extractor.__init__(self, match)
+
+
+class _8chanThreadExtractor(_8chanExtractor):
+    """Extractor for 8chan threads"""
+    subcategory = "thread"
+    directory_fmt = ("{category}", "{boardUri}",
+                     "{threadId} {subject[:50]}")
+    filename_fmt = "{postId}{num:?-//} {filename[:200]}.{extension}"
+    archive_fmt = "{boardUri}_{postId}_{num}"
+    pattern = BASE_PATTERN + r"/([^/?#]+)/res/(\d+)"
+
+    def __init__(self, match):
+        _8chanExtractor.__init__(self, match)
+        _, self.board, self.thread = match.groups()
+
+    def items(self):
+        # fetch thread data
+        url = "{}/{}/res/{}.json".format(self.root, self.board, self.thread)
+        thread = self.request(url).json()
+        thread["postId"] = thread["threadId"]
+        posts = thread.pop("posts", ())
+
+        yield Message.Directory, thread
+        for post in itertools.chain((thread,), posts):
+            files = post.pop("files", None)
+            if not files:
+                continue
+            thread.update(post)
+            for num, file in enumerate(files):
+                file.update(thread)
+                file["num"] = num
+                text.nameext_from_url(file["originalName"], file)
+                yield Message.Url, self.root + file["path"], file
+
+
+class _8chanBoardExtractor(_8chanExtractor):
+    """Extractor for 8chan boards"""
+    subcategory = "board"
+    pattern = BASE_PATTERN + r"/([^/?#]+)(?:/(\d+)\.html)?$"
+
+    def __init__(self, match):
+        _8chanExtractor.__init__(self, match)
+        _, self.board, self.page = match.groups()
+
+    def items(self):
+        page = text.parse_int(self.page, 1)
+        url = "{}/{}/{}.json".format(self.root, self.board, page)
+        board = self.request(url).json()
+        threads = board["threads"]
+
+        while True:
+            for thread in threads:
+                thread["_extractor"] = _8chanThreadExtractor
+                url = "{}/{}/res/{}.html".format(
+                    self.root, self.board, thread["threadId"])
+                yield Message.Queue, url, thread
+
+            page += 1
+            if page > 
board["pageCount"]: + return + url = "{}/{}/{}.json".format(self.root, self.board, page) + threads = self.request(url).json()["threads"] diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/8kun.py gallery-dl-1.24.0/gallery_dl/extractor/8kun.py --- gallery-dl-1.23.2/gallery_dl/extractor/8kun.py 2022-07-12 13:49:22.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/8kun.py 1970-01-01 00:00:00.000000000 +0000 @@ -1,100 +0,0 @@ -# -*- coding: utf-8 -*- - -# Copyright 2020-2022 Mike Fährmann -# -# This program is free software; you can redistribute it and/or modify -# it under the terms of the GNU General Public License version 2 as -# published by the Free Software Foundation. - -"""Extractors for https://8kun.top/""" - -from .common import Extractor, Message -from .. import text - - -class _8kunThreadExtractor(Extractor): - """Extractor for 8kun threads""" - category = "8kun" - subcategory = "thread" - directory_fmt = ("{category}", "{board}", "{thread} {title}") - filename_fmt = "{time}{num:?-//} {filename}.{extension}" - archive_fmt = "{board}_{thread}_{tim}" - pattern = r"(?:https?://)?8kun\.top/([^/]+)/res/(\d+)" - test = ( - ("https://8kun.top/test/res/65248.html", { - "pattern": r"https://media\.8kun\.top/file_store/\w{64}\.\w+", - "count": ">= 8", - }), - # old-style file URLs (#1101) - # ("https://8kun.top/d/res/13258.html", { - # "pattern": r"https://media\.8kun\.top/d/src/\d+(-\d)?\.\w+", - # "range": "1-20", - # }), - ) - - def __init__(self, match): - Extractor.__init__(self, match) - self.board, self.thread = match.groups() - - def items(self): - url = "https://8kun.top/{}/res/{}.json".format(self.board, self.thread) - posts = self.request(url).json()["posts"] - title = posts[0].get("sub") or text.remove_html(posts[0]["com"]) - process = self._process - - data = { - "board" : self.board, - "thread": self.thread, - "title" : text.unescape(title)[:50], - "num" : 0, - } - - yield Message.Directory, data - for post in posts: - if "filename" in post: - yield process(post, data) - if "extra_files" in post: - for post["num"], filedata in enumerate( - post["extra_files"], 1): - yield process(post, filedata) - - @staticmethod - def _process(post, data): - post.update(data) - post["extension"] = post["ext"][1:] - tim = post["tim"] - url = ("https://media.8kun.top/" + - ("file_store/" if len(tim) > 16 else post["board"] + "/src/") + - tim + post["ext"]) - return Message.Url, url, post - - -class _8kunBoardExtractor(Extractor): - """Extractor for 8kun boards""" - category = "8kun" - subcategory = "board" - pattern = r"(?:https?://)?8kun\.top/([^/?#]+)/(?:index|\d+)\.html" - test = ( - ("https://8kun.top/v/index.html", { - "pattern": _8kunThreadExtractor.pattern, - "count": ">= 100", - }), - ("https://8kun.top/v/2.html"), - ("https://8kun.top/v/index.html?PageSpeed=noscript"), - ) - - def __init__(self, match): - Extractor.__init__(self, match) - self.board = match.group(1) - - def items(self): - url = "https://8kun.top/{}/threads.json".format(self.board) - threads = self.request(url).json() - - for page in threads: - for thread in page["threads"]: - url = "https://8kun.top/{}/res/{}.html".format( - self.board, thread["no"]) - thread["page"] = page["page"] - thread["_extractor"] = _8kunThreadExtractor - yield Message.Queue, url, thread diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/8muses.py gallery-dl-1.24.0/gallery_dl/extractor/8muses.py --- gallery-dl-1.23.2/gallery_dl/extractor/8muses.py 2022-07-12 13:49:22.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/8muses.py 
2022-11-10 12:38:30.000000000 +0000
@@ -76,9 +76,9 @@
         url = self.root + self.path + self.params
 
         while True:
-            data = self._unobfuscate(text.extract(
+            data = self._unobfuscate(text.extr(
                 self.request(url).text,
-                'id="ractive-public" type="text/plain">', '</script>')[0])
+                'id="ractive-public" type="text/plain">', '</script>'))
 
             images = data.get("pictures")
             if images:
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/artstation.py gallery-dl-1.24.0/gallery_dl/extractor/artstation.py
--- gallery-dl-1.23.2/gallery_dl/extractor/artstation.py	2022-09-30 14:46:45.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/artstation.py	2022-11-10 12:38:30.000000000 +0000
@@ -41,8 +41,8 @@
         if adict["has_embedded_player"] and self.external:
             player = adict["player_embedded"]
-            url = text.extract(player, 'src="', '"')[0] or \
-                text.extract(player, "src='", "'")[0]
+            url = (text.extr(player, 'src="', '"') or
+                   text.extr(player, "src='", "'"))
             if url and not url.startswith(self.root):
                 asset["extension"] = None
                 yield Message.Url, "ytdl:" + url, asset
@@ -76,7 +76,12 @@
     def get_project_assets(self, project_id):
         """Return all assets associated with 'project_id'"""
         url = "{}/projects/{}.json".format(self.root, project_id)
-        data = self.request(url).json()
+
+        try:
+            data = self.request(url).json()
+        except exception.HttpError as exc:
+            self.log.warning(exc)
+            return
 
         data["title"] = text.unescape(data["title"])
         data["description"] = text.unescape(text.remove_html(
@@ -406,6 +411,10 @@
             "options": (("external", True),),
             "pattern": "ytdl:https://www.youtube.com/embed/JNFfJtwwrU0",
         }),
+        # 404 (#3016)
+        ("https://www.artstation.com/artwork/3q3mXB", {
+            "count": 0,
+        }),
         # alternate URL patterns
         ("https://sungchoi.artstation.com/projects/LQVJr"),
         ("https://artstn.co/p/LQVJr"),
@@ -419,7 +428,10 @@
     def metadata(self):
         self.assets = list(ArtstationExtractor.get_project_assets(
             self, self.project_id))
-        self.user = self.assets[0]["user"]["username"]
+        try:
+            self.user = self.assets[0]["user"]["username"]
+        except IndexError:
+            self.user = ""
         return ArtstationExtractor.metadata(self)
 
     def projects(self):
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/aryion.py gallery-dl-1.24.0/gallery_dl/extractor/aryion.py
--- gallery-dl-1.23.2/gallery_dl/extractor/aryion.py	2022-05-30 10:58:03.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/aryion.py	2022-11-10 12:38:30.000000000 +0000
@@ -128,8 +128,7 @@
         # get filename from 'Content-Disposition' header
         cdis = headers["content-disposition"]
-        fname, _, ext = text.extract(
-            cdis, 'filename="', '"')[0].rpartition(".")
+        fname, _, ext = text.extr(cdis, 'filename="', '"').rpartition(".")
         if not fname:
             fname, ext = ext, fname
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/bbc.py gallery-dl-1.24.0/gallery_dl/extractor/bbc.py
--- gallery-dl-1.23.2/gallery_dl/extractor/bbc.py	2022-02-01 23:09:19.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/bbc.py	2022-11-10 12:38:30.000000000 +0000
@@ -38,8 +38,8 @@
     )
 
     def metadata(self, page):
-        data = json.loads(text.extract(
-            page, '<script type="application/ld+json">', '</script>')[0])
+        data = json.loads(text.extr(
+            page, '<script type="application/ld+json">', '</script>'))
         return {
             "programme": self.gallery_url.split("/")[4],
             "path": list(util.unique_sequence(
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/bcy.py gallery-dl-1.24.0/gallery_dl/extractor/bcy.py
--- gallery-dl-1.23.2/gallery_dl/extractor/bcy.py	2022-05-03 10:22:33.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/bcy.py	2022-11-10 12:38:30.000000000 +0000
@@ -1,6 +1,6 @@
 # -*- coding: utf-8 -*-
 
-# Copyright 2020-2021 Mike Fährmann
+# Copyright 2020-2022 
Mike Fährmann # # This program is free software; you can redistribute it and/or modify # it under the terms of the GNU General Public License version 2 as @@ -25,9 +25,12 @@ def __init__(self, match): Extractor.__init__(self, match) self.item_id = match.group(1) + self.session.headers["Referer"] = self.root + "/" def items(self): - sub = re.compile(r"^https?://p\d+-bcy\.byteimg\.com/img/banciyuan").sub + sub = re.compile(r"^https?://p\d+-bcy" + r"(?:-sign\.bcyimg\.com|\.byteimg\.com/img)" + r"/banciyuan").sub iroot = "https://img-bcy-qn.pstatp.com" noop = self.config("noop") @@ -64,19 +67,18 @@ url = image["path"].partition("~")[0] text.nameext_from_url(url, data) + # full-resolution image without watermark if data["extension"]: if not url.startswith(iroot): url = sub(iroot, url) data["filter"] = "" yield Message.Url, url, data + # watermarked image & low quality noop filter else: - if not multi: - if len(post["multi"]) < len(post["image_list"]): - multi = self._data_from_post(post["item_id"]) - multi = multi["post_data"]["multi"] - else: - multi = post["multi"] + if multi is None: + multi = self._data_from_post( + post["item_id"])["post_data"]["multi"] image = multi[data["num"] - 1] if image["origin"]: @@ -95,7 +97,7 @@ url = "{}/item/detail/{}".format(self.root, post_id) page = self.request(url, notfound="post").text return json.loads( - text.extract(page, 'JSON.parse("', '");')[0] + text.extr(page, 'JSON.parse("', '");') .replace('\\\\u002F', '/') .replace('\\"', '"') )["detail"] @@ -111,8 +113,8 @@ "count": ">= 20", }), ("https://bcy.net/u/109282764041", { - "pattern": r"https://p\d-bcy.byteimg.com/img/banciyuan/[0-9a-f]+" - r"~tplv-banciyuan-logo-v3:.+\.image", + "pattern": r"https://p\d-bcy-sign\.bcyimg\.com/banciyuan/[0-9a-f]+" + r"~tplv-bcyx-yuan-logo-v1:.+\.image", "range": "1-25", "count": 25, }), @@ -171,13 +173,13 @@ }), # only watermarked images available ("https://bcy.net/item/detail/6950136331708144648", { - "pattern": r"https://p\d-bcy.byteimg.com/img/banciyuan/[0-9a-f]+" - r"~tplv-banciyuan-logo-v3:.+\.image", - "count": 8, + "pattern": r"https://p\d-bcy-sign\.bcyimg\.com/banciyuan/[0-9a-f]+" + r"~tplv-bcyx-yuan-logo-v1:.+\.image", + "count": 10, "keyword": {"filter": "watermark"}, }), # deleted - ("https://bcy.net/item/detail/6780546160802143236", { + ("https://bcy.net/item/detail/6780546160802143237", { "exception": exception.NotFoundError, "count": 0, }), diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/behance.py gallery-dl-1.24.0/gallery_dl/extractor/behance.py --- gallery-dl-1.23.2/gallery_dl/extractor/behance.py 2022-05-03 10:22:33.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/behance.py 2022-11-10 12:38:30.000000000 +0000 @@ -119,8 +119,8 @@ } page = self.request(url, cookies=cookies).text - data = json.loads(text.extract( - page, 'id="beconfig-store_state">', '')[0]) + data = json.loads(text.extr( + page, 'id="beconfig-store_state">', '')) return self._update(data["project"]["project"]) def get_images(self, data): @@ -137,7 +137,7 @@ elif mtype == "video": page = self.request(module["src"]).text - url = text.extract(page, '', '<')[0]) + 'id="__NEXT_DATA__" type="application/json">', '<')) album = data["props"]["pageProps"]["album"] files = album["files"] except Exception as exc: diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/common.py gallery-dl-1.24.0/gallery_dl/extractor/common.py --- gallery-dl-1.23.2/gallery_dl/extractor/common.py 2022-09-30 14:46:45.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/common.py 2022-11-15 
11:32:45.000000000 +0000 @@ -20,7 +20,7 @@ import threading from requests.adapters import HTTPAdapter from .message import Message -from .. import config, text, util, exception +from .. import config, text, util, cache, exception class Extractor(): @@ -122,8 +122,7 @@ seconds = (self._interval() - (time.time() - Extractor.request_timestamp)) if seconds > 0.0: - self.log.debug("Sleeping for %.5s seconds", seconds) - time.sleep(seconds) + self.sleep(seconds, "request") while True: try: @@ -150,14 +149,13 @@ msg = "'{} {}' for '{}'".format(code, response.reason, url) server = response.headers.get("Server") - if server and server.startswith("cloudflare"): - if code == 503 and \ - (b"_cf_chl_opt" in response.content or - b"jschl-answer" in response.content): + if server and server.startswith("cloudflare") and \ + code in (403, 503): + content = response.content + if b"_cf_chl_opt" in content or b"jschl-answer" in content: self.log.warning("Cloudflare IUAM challenge") break - if code == 403 and \ - b'name="captcha-bypass"' in response.content: + if b'name="captcha-bypass"' in content: self.log.warning("Cloudflare CAPTCHA") break if code < 500 and code != 429 and code != 430: @@ -169,8 +167,9 @@ self.log.debug("%s (%s/%s)", msg, tries, retries+1) if tries > retries: break - time.sleep( - max(tries, self._interval()) if self._interval else tries) + self.sleep( + max(tries, self._interval()) if self._interval else tries, + "retry") tries += 1 raise exception.HttpError(msg, response) @@ -202,6 +201,11 @@ self.log.info("Waiting until %s for %s.", isotime, reason) time.sleep(seconds) + def sleep(self, seconds, reason): + self.log.debug("Sleeping %.2f seconds (%s)", + seconds, reason) + time.sleep(seconds) + def _get_auth_info(self): """Return authentication information as (username, password) tuple""" username = self.config("username") @@ -258,9 +262,13 @@ ssl.OP_NO_TLSv1 | ssl.OP_NO_TLSv1_1) ssl_ciphers = SSL_CIPHERS[browser] else: - headers["User-Agent"] = self.config("user-agent", ( - "Mozilla/5.0 (Windows NT 10.0; Win64; x64; " - "rv:102.0) Gecko/20100101 Firefox/102.0")) + useragent = self.config("user-agent") + if useragent is None: + useragent = ("Mozilla/5.0 (Windows NT 10.0; Win64; x64; " + "rv:102.0) Gecko/20100101 Firefox/102.0") + elif useragent == "browser": + useragent = _browser_useragent() + headers["User-Agent"] = useragent headers["Accept"] = "*/*" headers["Accept-Language"] = "en-US,en;q=0.5" @@ -720,6 +728,36 @@ return adapter +@cache.cache(maxage=86400) +def _browser_useragent(): + """Get User-Agent header from default browser""" + import webbrowser + import socket + + server = socket.socket(socket.AF_INET, socket.SOCK_STREAM) + server.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1) + server.bind(("127.0.0.1", 6414)) + server.listen(1) + + webbrowser.open("http://127.0.0.1:6414/user-agent") + + client = server.accept()[0] + server.close() + + for line in client.recv(1024).split(b"\r\n"): + key, _, value = line.partition(b":") + if key.strip().lower() == b"user-agent": + useragent = value.strip() + break + else: + useragent = b"" + + client.send(b"HTTP/1.1 200 OK\r\n\r\n" + useragent) + client.close() + + return useragent.decode() + + _adapter_cache = {} _browser_cookies = {} diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/danbooru.py gallery-dl-1.24.0/gallery_dl/extractor/danbooru.py --- gallery-dl-1.23.2/gallery_dl/extractor/danbooru.py 2022-08-27 18:29:11.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/danbooru.py 2022-11-08 16:10:24.000000000 +0000 @@ -88,10 
+88,7 @@ if post["extension"] == "zip": if self.ugoira: - post["frames"] = self.request( - "{}/posts/{}.json?only=pixiv_ugoira_frame_data".format( - self.root, post["id"]) - ).json()["pixiv_ugoira_frame_data"]["data"] + post["frames"] = self._ugoira_frames(post) post["_http_adjust_extension"] = False else: url = post["large_file_url"] @@ -105,6 +102,9 @@ resp = self.request(template.format(self.root, post["id"])) post.update(resp.json()) + if url[0] == "/": + url = self.root + url + post.update(data) yield Message.Directory, post yield Message.Url, url, post @@ -139,6 +139,18 @@ else: return + def _ugoira_frames(self, post): + data = self.request("{}/posts/{}.json?only=media_metadata".format( + self.root, post["id"]) + ).json()["media_metadata"]["metadata"] + + ext = data["ZIP:ZipFileName"].rpartition(".")[2] + print(post["id"], ext) + fmt = ("{:>06}." + ext).format + delays = data["Ugoira:FrameDelays"] + return [{"file": fmt(index), "delay": delay} + for index, delay in enumerate(delays)] + INSTANCES = { "danbooru": { @@ -161,6 +173,10 @@ "pattern": r"booru\.allthefallen\.moe", "page-limit": 5000, }, + "aibooru": { + "root": None, + "pattern": r"(?:safe.)?aibooru\.online", + } } BASE_PATTERN = DanbooruExtractor.update(INSTANCES) @@ -193,10 +209,16 @@ ("https://booru.allthefallen.moe/posts?tags=yume_shokunin", { "count": 12, }), + ("https://aibooru.online/posts?tags=center_frills&z=1", { + "pattern": r"https://aibooru\.online/data/original" + r"/[0-9a-f]{2}/[0-9a-f]{2}/[0-9a-f]{32}\.\w+", + "count": ">= 3", + }), ("https://hijiribe.donmai.us/posts?tags=bonocho"), ("https://sonohara.donmai.us/posts?tags=bonocho"), ("https://safebooru.donmai.us/posts?tags=bonocho"), ("https://e926.net/posts?tags=anry"), + ("https://safe.aibooru.online/posts?tags=center_frills"), ) def __init__(self, match): @@ -229,6 +251,7 @@ "url": "902549ffcdb00fe033c3f63e12bc3cb95c5fd8d5", "count": 6, }), + ("https://aibooru.online/pools/1"), ("https://danbooru.donmai.us/pool/show/7659"), ("https://e621.net/pool/show/73"), ) @@ -291,6 +314,9 @@ ("https://booru.allthefallen.moe/posts/22", { "content": "21dda68e1d7e0a554078e62923f537d8e895cac8", }), + ("https://aibooru.online/posts/1", { + "content": "54d548743cd67799a62c77cbae97cfa0fec1b7e9", + }), ("https://danbooru.donmai.us/post/show/294929"), ("https://e621.net/post/show/535"), ) @@ -325,6 +351,7 @@ "count": ">= 70", }), ("https://booru.allthefallen.moe/explore/posts/popular"), + ("https://aibooru.online/explore/posts/popular"), ) def __init__(self, match): diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/deviantart.py gallery-dl-1.24.0/gallery_dl/extractor/deviantart.py --- gallery-dl-1.23.2/gallery_dl/extractor/deviantart.py 2022-09-30 14:46:45.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/deviantart.py 2022-11-10 12:38:30.000000000 +0000 @@ -72,7 +72,7 @@ def items(self): self.api = DeviantartOAuthAPI(self) - if self.user: + if self.user and self.config("group", True): profile = self.api.user_profile(self.user) self.group = not profile if self.group: @@ -603,22 +603,22 @@ page = self._limited_request(url).text if stash_id[0] == "0": - uuid = text.extract(page, '//deviation/', '"')[0] + uuid = text.extr(page, '//deviation/', '"') if uuid: deviation = self.api.deviation(uuid) - deviation["index"] = text.parse_int(text.extract( - page, 'gmi-deviationid="', '"')[0]) + deviation["index"] = text.parse_int(text.extr( + page, 'gmi-deviationid="', '"')) yield deviation return for item in text.extract_iter( page, 'class="stash-thumb-container', ''): - url = 
text.extract(item, '[^/?#]+)/(?P[^?#]+\." r"(?:jpe?g|jpe|png|gif|web[mp]|mp4|mkv|og[gmv]|opus))" - r"(?:\?(?P[^/?#]*))?(?:#(?P.*))?$") + r"(?:\?(?P[^#]*))?(?:#(?P.*))?$") test = ( (("https://en.wikipedia.org/static/images/project-logos/enwiki.png"), { "url": "18c5d00077332e98e53be9fed2ee4be66154b88d", @@ -31,9 +31,9 @@ "keyword": "29dad729c40fb09349f83edafa498dba1297464a", }), # more complex example - ("https://example.org/path/to/file.webm?que=1&ry=2#fragment", { - "url": "114b8f1415cc224b0f26488ccd4c2e7ce9136622", - "keyword": "06014abd503e3b2b58aa286f9bdcefdd2ae336c0", + ("https://example.org/path/to/file.webm?que=1?&ry=2/#fragment", { + "url": "6fb1061390f8aada3db01cb24b51797c7ee42b31", + "keyword": "3d7abc31d45ba324e59bc599c3b4862452d5f29c", }), # percent-encoded characters ("https://example.org/%27%3C%23/%23%3E%27.jpg?key=%3C%26%3E", { diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/dynastyscans.py gallery-dl-1.24.0/gallery_dl/extractor/dynastyscans.py --- gallery-dl-1.23.2/gallery_dl/extractor/dynastyscans.py 2022-05-03 10:22:33.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/dynastyscans.py 2022-11-10 12:38:30.000000000 +0000 @@ -30,7 +30,7 @@ src = extr("class='btn-group'>", "") url = extr(' src="', '"') - src = text.extract(src, 'href="', '"')[0] if "Source<" in src else "" + src = text.extr(src, 'href="', '"') if "Source<" in src else "" return { "url" : self.root + url, @@ -75,7 +75,7 @@ "title" : text.unescape(match.group(4) or ""), "author" : text.remove_html(author), "group" : (text.remove_html(group) or - text.extract(group, ' alt="', '"')[0] or ""), + text.extr(group, ' alt="', '"')), "date" : text.parse_datetime(extr( '"icon-calendar"> ', '<'), "%b %d, %Y"), "lang" : "en", @@ -83,7 +83,7 @@ } def images(self, page): - data = text.extract(page, "var pages = ", ";\n")[0] + data = text.extr(page, "var pages = ", ";\n") return [ (self.root + img["image"], None) for img in json.loads(data) diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/erome.py gallery-dl-1.24.0/gallery_dl/extractor/erome.py --- gallery-dl-1.23.2/gallery_dl/extractor/erome.py 2022-09-19 20:55:23.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/erome.py 2022-11-10 12:38:30.000000000 +0000 @@ -55,8 +55,8 @@ yield Message.Directory, data groups = page.split('
", "<")[0]) + data["uploader"] = text.unescape(text.extr( + data["uploader"], ">", "<")) f = data["favorites"][0] if f == "N": @@ -400,7 +400,7 @@ } page = self.request(url, cookies=cookies).text - current = text.extract(page, "", "")[0] + current = text.extr(page, "", "") self.log.debug("Image Limits: %s/%s", current, self.limits) self._remaining = self.limits - text.parse_int(current) @@ -473,6 +473,10 @@ "pattern": ExhentaiGalleryExtractor.pattern, "range": "1-30", "count": 30, + "keyword": { + "gallery_id": int, + "gallery_token": r"re:^[0-9a-f]{10}$" + }, }), ) @@ -490,26 +494,39 @@ self.params = {"f_search": tag, "page": 0} else: self.params = text.parse_query(query) - self.params["page"] = text.parse_int(self.params.get("page")) + if "next" not in self.params: + self.params["page"] = text.parse_int(self.params.get("page")) def items(self): self.login() data = {"_extractor": ExhentaiGalleryExtractor} + search_url = self.search_url + params = self.params while True: last = None - page = self.request(self.search_url, params=self.params).text + page = self.request(search_url, params=params).text for gallery in ExhentaiGalleryExtractor.pattern.finditer(page): url = gallery.group(0) if url == last: continue last = url + data["gallery_id"] = text.parse_int(gallery.group(2)) + data["gallery_token"] = gallery.group(3) yield Message.Queue, url + "/", data - if 'class="ptdd">><' in page or ">No hits found

" in page: + next_url = text.extr(page, 'nexturl = "', '"', None) + if next_url is not None: + if not next_url: + return + search_url = next_url + params = None + + elif 'class="ptdd">><' in page or ">No hits found

" in page: return - self.params["page"] += 1 + else: + params["page"] += 1 class ExhentaiFavoriteExtractor(ExhentaiSearchExtractor): diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/fallenangels.py gallery-dl-1.24.0/gallery_dl/extractor/fallenangels.py --- gallery-dl-1.23.2/gallery_dl/extractor/fallenangels.py 2021-12-11 02:38:22.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/fallenangels.py 2022-11-10 12:38:30.000000000 +0000 @@ -57,7 +57,7 @@ return [ (img["page_image"], None) for img in json.loads( - text.extract(page, "var pages = ", ";")[0] + text.extr(page, "var pages = ", ";") ) ] diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/fanbox.py gallery-dl-1.24.0/gallery_dl/extractor/fanbox.py --- gallery-dl-1.23.2/gallery_dl/extractor/fanbox.py 2022-08-27 18:29:11.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/fanbox.py 2022-11-08 16:10:24.000000000 +0000 @@ -68,6 +68,16 @@ post["html"] = content_body["html"] if post["type"] == "article": post["articleBody"] = content_body.copy() + if "blocks" in content_body: + content = [] + append = content.append + for block in content_body["blocks"]: + if "text" in block: + append(block["text"]) + if "links" in block: + for link in block["links"]: + append(link["url"]) + post["content"] = "\n".join(content) post["date"] = text.parse_datetime(post["publishedDatetime"]) post["text"] = content_body.get("text") if content_body else None @@ -271,6 +281,19 @@ "hasAdultContent": True }, }), + # 'content' metadata (#3020) + ("https://www.fanbox.cc/@official-en/posts/4326303", { + "keyword": { + "content": r"re:(?s)^Greetings from FANBOX.\n \nAs of Monday, " + r"September 5th, 2022, we are happy to announce " + r"the start of the FANBOX hashtag event " + r"#MySetupTour ! \nAbout the event\nTo join this " + r"event .+ \nPlease check this page for further " + r"details regarding the Privacy & Terms.\n" + r"https://fanbox.pixiv.help/.+/10184952456601\n\n\n" + r"Thank you for your continued support of FANBOX.$", + }, + }), ) def __init__(self, match): diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/foolfuuka.py gallery-dl-1.24.0/gallery_dl/extractor/foolfuuka.py --- gallery-dl-1.23.2/gallery_dl/extractor/foolfuuka.py 2022-08-27 18:29:11.000000000 +0000 +++ gallery-dl-1.24.0/gallery_dl/extractor/foolfuuka.py 2022-11-10 12:38:30.000000000 +0000 @@ -56,7 +56,7 @@ """Resolve a remote media link""" needle = '", "")[0].strip() + title = text.extr(page, "", "").strip() title, _, gallery_id = title.rpartition("#") return { @@ -104,7 +104,7 @@ page, 'class="pic_pad">
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/fuskator.py gallery-dl-1.24.0/gallery_dl/extractor/fuskator.py
--- gallery-dl-1.23.2/gallery_dl/extractor/fuskator.py
+++ gallery-dl-1.24.0/gallery_dl/extractor/fuskator.py	2022-11-10 12:38:30.000000000 +0000
-        title = text.extract(page, "<title>", "</title>")[0].strip()
+        title = text.extr(page, "<title>", "</title>").strip()
         title, _, gallery_id = title.rpartition("#")
 
         return {
@@ -104,7 +104,7 @@
                     page, 'class="pic_pad"><a href="', '"'):
                 yield Message.Queue, self.root + path, data
 
-            pages = text.extract(page, 'class="pages">', '>>><')[0]
+            pages = text.extr(page, 'class="pages">', '>>><')
             if not pages:
                 return
             url = self.root + text.rextract(pages, 'href="', '"')[0]
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/gelbooru.py gallery-dl-1.24.0/gallery_dl/extractor/gelbooru.py
--- gallery-dl-1.23.2/gallery_dl/extractor/gelbooru.py	2022-08-27 18:29:11.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/gelbooru.py	2022-11-10 12:38:30.000000000 +0000
@@ -68,6 +68,22 @@
             yield "https://img2.gelbooru.com" + path
             yield "https://img1.gelbooru.com" + path
 
+    def _notes(self, post, page):
+        notes_data = text.extr(page, '<section id="notes"', '</section>')
+        if not notes_data:
+            return
+
+        post["notes"] = notes = []
+        extr = text.extract
+        for note in text.extract_iter(notes_data, '<article', '</article>'):
+            notes.append({
+                "width" : int(extr(note, 'data-width="', '"')[0]),
+                "height": int(extr(note, 'data-height="', '"')[0]),
+                "x"     : int(extr(note, 'data-x="', '"')[0]),
+                "y"     : int(extr(note, 'data-y="', '"')[0]),
+                "body"  : extr(note, 'data-body="', '"')[0],
+            })
+
 
 class GelbooruTagExtractor(GelbooruBase,
                            gelbooru_v02.GelbooruV02TagExtractor):
@@ -142,13 +158,23 @@
 class GelbooruPostExtractor(GelbooruBase,
                             gelbooru_v02.GelbooruV02PostExtractor):
     """Extractor for single images from gelbooru.com"""
-    pattern = (r"(?:https?://)?(?:www\.)?gelbooru\.com/(?:index\.php)?"
-               r"\?page=post&s=view&id=(?P<post>\d+)")
+    pattern = (r"(?:https?://)?(?:www\.)?gelbooru\.com/(?:index\.php)?\?"
+               r"(?=(?:[^#]+&)?page=post(?:&|#|$))"
+               r"(?=(?:[^#]+&)?s=view(?:&|#|$))"
+               r"(?:[^#]+&)?id=(\d+)")
     test = (
         ("https://gelbooru.com/index.php?page=post&s=view&id=313638", {
             "content": "5e255713cbf0a8e0801dc423563c34d896bb9229",
             "count": 1,
         }),
+
+        ("https://gelbooru.com/index.php?page=post&s=view&id=313638"),
+        ("https://gelbooru.com/index.php?s=view&page=post&id=313638"),
+        ("https://gelbooru.com/index.php?page=post&id=313638&s=view"),
+        ("https://gelbooru.com/index.php?s=view&id=313638&page=post"),
+        ("https://gelbooru.com/index.php?id=313638&page=post&s=view"),
+        ("https://gelbooru.com/index.php?id=313638&s=view&page=post"),
+
         ("https://gelbooru.com/index.php?page=post&s=view&id=6018318", {
             "options": (("tags", True),),
             "content": "977caf22f27c72a5d07ea4d4d9719acdab810991",
@@ -172,21 +198,21 @@
             "keyword": {
                 "notes": [
                     {
-                        "height": 553,
                         "body": "Look over this way when you talk~",
+                        "height": 553,
                         "width": 246,
                         "x": 35,
-                        "y": 72
+                        "y": 72,
                     },
                     {
-                        "height": 557,
                         "body": "Hey~\nAre you listening~?",
+                        "height": 557,
                         "width": 246,
                         "x": 1233,
-                        "y": 109
-                    }
-                ]
-            }
+                        "y": 109,
+                    },
+                ],
+            },
         }),
     )
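
Gelbooru's new `_notes` override above reads each note's geometry and text from `data-*` attributes on the `<article>` elements inside the notes section. A condensed sketch of that scraping using only the standard `re` module (the real code uses gallery-dl's `text.extract` helpers with the delimiter pairs shown in the hunk):

    import re

    def parse_notes(notes_section):
        """Collect geometry and body text from each note's data-* attributes."""
        notes = []
        for note in notes_section.split("<article")[1:]:
            attr = dict(re.findall(r'data-(\w+)="([^"]*)"', note))
            notes.append({
                "width" : int(attr["width"]),
                "height": int(attr["height"]),
                "x"     : int(attr["x"]),
                "y"     : int(attr["y"]),
                "body"  : attr["body"],
            })
        return notes
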
diff -Nru gallery-dl-1.23.2/gallery_dl/extractor/gelbooru_v02.py gallery-dl-1.24.0/gallery_dl/extractor/gelbooru_v02.py
--- gallery-dl-1.23.2/gallery_dl/extractor/gelbooru_v02.py	2022-10-01 10:34:23.000000000 +0000
+++ gallery-dl-1.24.0/gallery_dl/extractor/gelbooru_v02.py	2022-11-10 16:03:18.000000000 +0000
@@ -31,6 +31,7 @@
 
         if self.category == "realbooru":
             self._file_url = self._file_url_realbooru
+            self._tags = self._tags_realbooru
 
     def _api_request(self, params):
         url = self.api_root + "/index.php?page=dapi&s=post&q=index"
@@ -85,55 +86,58 @@
             post["date"] = text.parse_datetime(
                 post["created_at"], "%a %b %d %H:%M:%S %z %Y")
 
+    def _html(self, post):
+        return self.request("{}/index.php?page=post&s=view&id={}".format(
+            self.root, post["id"])).text
+
+    def _tags(self, post, page):
+        tag_container = (text.extr(page, '<ul id="tag-sidebar"', '</ul>') or
+                         text.extr(page, '<ul class="tag-list"', '</ul>'))
+        if not tag_container:
+            return
+
+        tags = collections.defaultdict(list)
+        pattern = re.compile(
+            r"tag-type-([^\"' ]+).*?[?;]tags=([^\"'&]+)", re.S)
+        for tag_type, tag_name in pattern.findall(tag_container):
+            tags[tag_type].append(text.unquote(tag_name))
+        for key, value in tags.items():
+            post["tags_" + key] = " ".join(value)
+
+    def _notes(self, post, page):
+        note_container = text.extr(page, 'id="note-container"', "<img ")
+        if not note_container:
+            return
+
+        post["notes"] = notes = []
+        for note in note_container.split('class="note-box"')[1:]:
+            extr = text.extract_from(note)
+            notes.append({
+                "width" : int(extr("width:", "p")),
+                "height": int(extr("height:", "p")),
+                "y"     : int(extr("top:", "p")),
+                "x"     : int(extr("left:", "p")),
+                "body"  : text.unescape(text.remove_html(extr(">", "</div>"))),
+            })
+
     def _file_url_realbooru(self, post):
         url = post["file_url"]
-        if url.count("/") == 5:
-            md5 = post["md5"]
+        md5 = post["md5"]
+        if md5 not in post["preview_url"] or url.count("/") == 5:
             url = "{}/images/{}/{}/{}.{}".format(
                 self.root, md5[0:2], md5[2:4], md5, url.rpartition(".")[2])
         return url
 
-    def _extended_tags(self, post, page=None):
-        if not page:
-            url = "{}/index.php?page=post&s=view&id={}".format(
-                self.root, post["id"])
-            page = self.request(url).text
-        html = text.extract(page, '