-
Notifications
You must be signed in to change notification settings - Fork 7
/
scrapeUE4Docs.sh
24 lines (20 loc) · 1.11 KB
/
scrapeUE4Docs.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
#!/bin/bash
#
# Mirror one section of the Unreal Engine online documentation with httrack.
#
# Usage: scrapeUE4Docs.sh <section> <output-dir> [extra-httrack-options]
#   $1  path below https://docs.unrealengine.com/en-US/ whose index.html is
#       the starting page of the crawl
#   $2  directory (taken relative to the current directory) handed to
#       httrack's -O option
#   $3  optional; additional httrack options in ONE string, split on
#       whitespace (e.g. "-v -%P")
#
# Exit status: 2 on bad usage, 127 when httrack is not installed,
# otherwise whatever httrack returns.

set -euo pipefail

# These are big web sites so we need to increase the max to get everything.
readonly LINK_LIMIT='-#L500000' # Max number of links traversed

# If you are going to use the risky settings below, you need this.
readonly DISABLE_SEC='--disable-security-limits' # Disable some built in security standards

# These settings attempt to speed up httrack but are RISKY.
# Consider your network, the server, and other factors when adjusting.
readonly ROBOTS='-s0'        # Ignore the robots.txt limits (0 is ignore)
readonly RATE_LIMIT='-A0'    # Bitrate limit (0 means no limit)
readonly MAX_CONNECTS='-%c0' # Max connections per second (0 means no limit)
readonly CONNECTS='-c4'      # Number of simultaneous connections

# Host (with explicit port) shared by the start URL and the scan filters.
readonly DOCS_HOST='docs.unrealengine.com:443'

# Print a usage line to stderr and exit with status 2.
usage() {
  printf 'Usage: %s <section> <output-dir> [extra-httrack-options]\n' \
    "${0##*/}" >&2
  exit 2
}

# Validate the arguments, assemble the httrack command line as an array
# (so no argument is ever re-split or glob-expanded), and run it.
main() {
  local section=${1:-}
  local out_dir=${2:-}
  local extra=${3:-}
  local -a extra_opts=()
  local -a cmd

  # Without both values the start URL and output path would be malformed
  # ("en-US//index.html", ".//"), so refuse to start instead.
  [[ -n "$section" && -n "$out_dir" ]] || usage

  if ! command -v httrack >/dev/null; then
    printf '%s: httrack not found in PATH\n' "${0##*/}" >&2
    exit 127
  fi

  # $3 packs several options into one string. Split it on whitespace but
  # WITHOUT pathname expansion, so a filter such as "+*.png" stays literal.
  # With -d '' read consumes the whole string and then reports EOF with a
  # non-zero status; that is expected, hence the deliberate "|| true".
  read -r -d '' -a extra_opts <<< "$extra" || true

  cmd=(
    httrack
    -%l 'en'
    -F 'Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98)'
    -%F '<!-- Mirrored from %s%s by HTTrack Website Copier/3.x, %s -->'
    "https://${DOCS_HOST}/en-US/${section}/index.html"
    -i
    -O "./${out_dir}/"
    -%v
    "$DISABLE_SEC" "$LINK_LIMIT" "$CONNECTS"
    "$MAX_CONNECTS" "$RATE_LIMIT" "$ROBOTS"
    # Expands to nothing when no extra options were given; this form is
    # also safe under "set -u" on bash versions older than 4.4.
    ${extra_opts[@]+"${extra_opts[@]}"}
    # Scan filters: quoted so the trailing "*" reaches httrack verbatim
    # instead of being matched against files in the current directory.
    "+${DOCS_HOST}/en-US/${section}/*"
    "+${DOCS_HOST}/include/*"
    "+${DOCS_HOST}/images/*"
    '+static-assets-prod.epicgames.com/*'
  )

  "${cmd[@]}"
}

main "$@"