-
-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathdo-web-requests.php
executable file
·112 lines (101 loc) · 4.34 KB
/
do-web-requests.php
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
<?php
/************************************************************************************
*
* Sporks, the learning, scriptable Discord bot!
*
* Copyright 2019 Craig Edwards <[email protected]>
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* Sporks web request handler
*
* Whenever a javascript program requests a webpage via the get() or post() functions, it will
* insert a row for this request into the infobot_web_requests table. This script runs in a loop
* watching this table every half a second for new rows. When new rows are found, web requests
* are made (either GET or POST) and then the row updated with the resulting content and a HTTP
* status code. Certain restrictions are placed on the request to prevent abuse:
*
* 1) DNS requets can only take up to 1 second
* 2) There can be only one attempt at DNS resolution per request
* 3) The initial connection may only take 2 seconds
* 4) There can be a maximum of 3 HTTP redirections per request
* 5) The entire request may only take 5 seconds
* 6) The POST body may be a maximum of 256k. Anything longer is truncated.
* 7) The returned content may be a maximum of 1mb. Anything longer is truncated.
*
*************************************************************************************/
$settings = json_decode(file_get_contents("config.json"));
$conn = mysqli_connect($settings->dbhost, $settings->dbuser, $settings->dbpass);
if (!$conn) {
die("Can't connect to database, check config.json\n");
}
mysqli_select_db($conn, $settings->dbname);
/* For gethostbyname sanity */
putenv('RES_OPTIONS=retrans:1 retry:1 timeout:1 attempts:1');
while (true) {
$q = mysqli_query($conn, "SELECT * FROM infobot_web_requests WHERE statuscode = '000'");
while ($rs = mysqli_fetch_object($q)) {
if (preg_match('/^\{.+?\}$/im', $rs->postdata) && $rs->type == 'POST') {
$mt = "application/json";
} else {
$mt = "application/x-www-form-urlencoded";
}
if (!preg_match("/^http:\/\//i", $rs->url) && !preg_match("/^https:\/\//i", $rs->url)) {
/* Prevent access to local files, stream context may be ignored. FU PHP. */
print "Invalid url $rs->url\n";
$response = FALSE;
} else {
if (preg_match("/^http:\/\//i", $rs->url)) {
$https = false;
} else {
$https = true;
}
/* Maximum of 1 meg actually retrieved, truncated after this */
$headers = ['User-Agent: Sporks/1.2', 'Content-Type: ' . $mt];
$host = parse_url($rs->url, PHP_URL_HOST);
$ch = curl_init($rs->url);
curl_setopt_array($ch, [
CURLOPT_FOLLOWLOCATION => 1,
CURLOPT_HEADER => 0,
CURLOPT_RETURNTRANSFER => 1,
CURLOPT_CUSTOMREQUEST => $rs->type,
CURLOPT_HTTPHEADER => $headers,
CURLOPT_CONNECTTIMEOUT => 2,
CURLOPT_MAXREDIRS => 3,
CURLOPT_TIMEOUT => 5,
CURLOPT_RESOLVE => [ $host . ':' . ($https ? '443' : '80') . ':' . gethostbyname($host) ]
]);
if ($rs->type == "POST") {
curl_setopt_array($ch, [
CURLOPT_POST => 1,
CURLOPT_POSTFIELDS => $rs->postdata,
]);
}
curl_setopt($ch, CURLOPT_BUFFERSIZE, 128); // more progress info
curl_setopt($ch, CURLOPT_NOPROGRESS, false);
curl_setopt($ch, CURLOPT_PROGRESSFUNCTION, function($curlhandle, $DownloadSize, $Downloaded, $UploadSize, $Uploaded) {
return ($Downloaded > (1024 * 1024) || ($Uploaded > 1024 * 256)) ? 1 : 0;
});
$response = curl_exec($ch);
$code = curl_getinfo($ch, CURLINFO_RESPONSE_CODE);
}
if ($response === FALSE) {
mysqli_query($conn, "UPDATE infobot_web_requests SET statuscode = '999', returndata = '' WHERE channel_id = ".$rs->channel_id);
echo $rs->url . " => ". curl_error($ch) ."\n";
} else {
mysqli_query($conn, "UPDATE infobot_web_requests SET statuscode = '$code', returndata = '".mysqli_real_escape_string($conn, $response)."' WHERE channel_id = ".$rs->channel_id);
echo $rs->url . " => $code\n";
}
}
usleep(500000);
}