• R/O
  • HTTP
  • SSH
  • HTTPS

コミット

タグ
未設定

よく使われているワード(クリックで追加)

javac++androidlinuxc#windowsobjective-ccocoa誰得qtpythonphprubygameguibathyscaphec計画中(planning stage)翻訳omegatframeworktwitterdomtestvb.netdirectxゲームエンジンbtronarduinopreviewer

XOOPS Cube Legacy base repository


コミットメタ情報

リビジョンc3718b7bff6d64f103b7b7eb380852c1ee1cec8a (tree)
日時2010-11-14 00:14:05
作者kilica <kilica@704c...>
コミッターkilica

ログメッセージ

- Fix Bug #2666664 - /class/snoopy.php is susceptible to a remote command.

git-svn-id: https://xoopscube.svn.sourceforge.net/svnroot/xoopscube/Package_Legacy/trunk@832 704cf05f-ae62-4b0e-a484-234ee0250e75

変更サマリ

差分

--- a/html/class/snoopy.php
+++ b/html/class/snoopy.php
@@ -1,1288 +1,1269 @@
1-<?php
2-
3-/*************************************************
4-
5-Snoopy - the PHP net client
6-Author: Monte Ohrt <monte@ispi.net>
7-Copyright (c): 1999-2000 ispi, all rights reserved
8-Version: 1.01
9-
10- * This library is free software; you can redistribute it and/or
11- * modify it under the terms of the GNU Lesser General Public
12- * License as published by the Free Software Foundation; either
13- * version 2.1 of the License, or (at your option) any later version.
14- *
15- * This library is distributed in the hope that it will be useful,
16- * but WITHOUT ANY WARRANTY; without even the implied warranty of
17- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18- * Lesser General Public License for more details.
19- *
20- * You should have received a copy of the GNU Lesser General Public
21- * License along with this library; if not, write to the Free Software
22- * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23-
24-You may contact the author of Snoopy by e-mail at:
25-monte@ispi.net
26-
27-Or, write to:
28-Monte Ohrt
29-CTO, ispi
30-237 S. 70th suite 220
31-Lincoln, NE 68510
32-
33-The latest version of Snoopy can be obtained from:
34-http://snoopy.sourceforge.net/
35-
36-*************************************************/
37-
38-class Snoopy
39-{
40- /**** Public variables ****/
41-
42- /* user definable vars */
43-
44- var $host = "www.php.net"; // host name we are connecting to
45- var $port = 80; // port we are connecting to
46- var $host_port = ""; // port for Host Header
47- var $proxy_host = ""; // proxy host to use
48- var $proxy_port = ""; // proxy port to use
49- var $proxy_user = ""; // proxy user to use
50- var $proxy_pass = ""; // proxy password to use
51-
52- var $agent = "Snoopy v1.2.3"; // agent we masquerade as
53- var $referer = ""; // referer info to pass
54- var $cookies = array(); // array of cookies to pass
55- // $cookies["username"]="joe";
56- var $rawheaders = array(); // array of raw headers to send
57- // $rawheaders["Content-type"]="text/html";
58-
59- var $maxredirs = 5; // http redirection depth maximum. 0 = disallow
60- var $lastredirectaddr = ""; // contains address of last redirected address
61- var $offsiteok = true; // allows redirection off-site
62- var $maxframes = 0; // frame content depth maximum. 0 = disallow
63- var $expandlinks = true; // expand links to fully qualified URLs.
64- // this only applies to fetchlinks()
65- // submitlinks(), and submittext()
66- var $passcookies = true; // pass set cookies back through redirects
67- // NOTE: this currently does not respect
68- // dates, domains or paths.
69-
70- var $user = ""; // user for http authentication
71- var $pass = ""; // password for http authentication
72-
73- // http accept types
74- var $accept = "image/gif, image/x-xbitmap, image/jpeg, image/pjpeg, */*";
75-
76- var $results = ""; // where the content is put
77-
78- var $error = ""; // error messages sent here
79- var $response_code = ""; // response code returned from server
80- var $headers = array(); // headers returned from server sent here
81- var $maxlength = 500000; // max return data length (body)
82- var $read_timeout = 0; // timeout on read operations, in seconds
83- // supported only since PHP 4 Beta 4
84- // set to 0 to disallow timeouts
85- var $timed_out = false; // if a read operation timed out
86- var $status = 0; // http request status
87-
88- var $temp_dir = "/tmp"; // temporary directory that the webserver
89- // has permission to write to.
90- // under Windows, this should be C:\temp
91-
92- var $curl_path = "/usr/local/bin/curl";
93- // Snoopy will use cURL for fetching
94- // SSL content if a full system path to
95- // the cURL binary is supplied here.
96- // set to false if you do not have
97- // cURL installed. See http://curl.haxx.se
98- // for details on installing cURL.
99- // Snoopy does *not* use the cURL
100- // library functions built into php,
101- // as these functions are not stable
102- // as of this Snoopy release.
103-
104- /**** Private variables ****/
105-
106- var $_maxlinelen = 4096; // max line length (headers)
107-
108- var $_httpmethod = "GET"; // default http request method
109- var $_httpversion = "HTTP/1.0"; // default http request version
110- var $_submit_method = "POST"; // default submit method
111- var $_submit_type = "application/x-www-form-urlencoded"; // default submit type
112- var $_mime_boundary = ""; // MIME boundary for multipart/form-data submit type
113- var $_redirectaddr = false; // will be set if page fetched is a redirect
114- var $_redirectdepth = 0; // increments on an http redirect
115- var $_frameurls = array(); // frame src urls
116- var $_framedepth = 0; // increments on frame depth
117-
118- var $_isproxy = false; // set if using a proxy server
119- var $_fp_timeout = 30; // timeout for socket connection
120-
121-/*======================================================================*\
122- Function: fetch
123- Purpose: fetch the contents of a web page
124- (and possibly other protocols in the
125- future like ftp, nntp, gopher, etc.)
126- Input: $URI the location of the page to fetch
127- Output: $this->results the output text from the fetch
128-\*======================================================================*/
129-
130- function fetch($URI)
131- {
132-
133- //preg_match("|^([^:]+)://([^:/]+)(:[\d]+)*(.*)|",$URI,$URI_PARTS);
134- $URI_PARTS = parse_url($URI);
135- if (!empty($URI_PARTS["user"]))
136- $this->user = $URI_PARTS["user"];
137- if (!empty($URI_PARTS["pass"]))
138- $this->pass = $URI_PARTS["pass"];
139- if (empty($URI_PARTS["query"]))
140- $URI_PARTS["query"] = '';
141- if (empty($URI_PARTS["path"]))
142- $URI_PARTS["path"] = '';
143-
144- switch(strtolower($URI_PARTS["scheme"]))
145- {
146- case "http":
147- $this->host = $URI_PARTS["host"];
148- if(!empty($URI_PARTS["port"])) {
149- $this->port = $URI_PARTS["port"];
150- $this->host_port = $URI_PARTS["port"];
151- }
152- if($this->_connect($fp))
153- {
154- if($this->_isproxy)
155- {
156- // using proxy, send entire URI
157- $this->_httprequest($URI,$fp,$URI,$this->_httpmethod);
158- }
159- else
160- {
161- $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
162- // no proxy, send only the path
163- $this->_httprequest($path, $fp, $URI, $this->_httpmethod);
164- }
165-
166- $this->_disconnect($fp);
167-
168- if($this->_redirectaddr)
169- {
170- /* url was redirected, check if we've hit the max depth */
171- if($this->maxredirs > $this->_redirectdepth)
172- {
173- // only follow redirect if it's on this site, or offsiteok is true
174- if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
175- {
176- /* follow the redirect */
177- $this->_redirectdepth++;
178- $this->lastredirectaddr=$this->_redirectaddr;
179- $this->fetch($this->_redirectaddr);
180- }
181- }
182- }
183-
184- if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
185- {
186- $frameurls = $this->_frameurls;
187- $this->_frameurls = array();
188-
189- while(list(,$frameurl) = each($frameurls))
190- {
191- if($this->_framedepth < $this->maxframes)
192- {
193- $this->fetch($frameurl);
194- $this->_framedepth++;
195- }
196- else
197- break;
198- }
199- }
200- }
201- else
202- {
203- return false;
204- }
205- return true;
206- break;
207- case "https":
208- if(!$this->curl_path)
209- return false;
210- if(function_exists("is_executable"))
211- if (!is_executable($this->curl_path))
212- return false;
213- $this->host = $URI_PARTS["host"];
214- if(!empty($URI_PARTS["port"])) {
215- $this->port = $URI_PARTS["port"];
216- $this->host_port = $URI_PARTS["port"];
217- }
218- if($this->_isproxy)
219- {
220- // using proxy, send entire URI
221- $this->_httpsrequest($URI,$URI,$this->_httpmethod);
222- }
223- else
224- {
225- $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
226- // no proxy, send only the path
227- $this->_httpsrequest($path, $URI, $this->_httpmethod);
228- }
229-
230- if($this->_redirectaddr)
231- {
232- /* url was redirected, check if we've hit the max depth */
233- if($this->maxredirs > $this->_redirectdepth)
234- {
235- // only follow redirect if it's on this site, or offsiteok is true
236- if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
237- {
238- /* follow the redirect */
239- $this->_redirectdepth++;
240- $this->lastredirectaddr=$this->_redirectaddr;
241- $this->fetch($this->_redirectaddr);
242- }
243- }
244- }
245-
246- if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
247- {
248- $frameurls = $this->_frameurls;
249- $this->_frameurls = array();
250-
251- while(list(,$frameurl) = each($frameurls))
252- {
253- if($this->_framedepth < $this->maxframes)
254- {
255- $this->fetch($frameurl);
256- $this->_framedepth++;
257- }
258- else
259- break;
260- }
261- }
262- return true;
263- break;
264- default:
265- // not a valid protocol
266- $this->error = 'Invalid protocol "'.$URI_PARTS["scheme"].'"\n';
267- return false;
268- break;
269- }
270- return true;
271- }
272-
273-/*======================================================================*\
274- Function: submit
275- Purpose: submit an http form
276- Input: $URI the location to post the data
277- $formvars the formvars to use.
278- format: $formvars["var"] = "val";
279- $formfiles an array of files to submit
280- format: $formfiles["var"] = "/dir/filename.ext";
281- Output: $this->results the text output from the post
282-\*======================================================================*/
283-
284- function submit($URI, $formvars="", $formfiles="")
285- {
286- unset($postdata);
287-
288- $postdata = $this->_prepare_post_body($formvars, $formfiles);
289-
290- $URI_PARTS = parse_url($URI);
291- if (!empty($URI_PARTS["user"]))
292- $this->user = $URI_PARTS["user"];
293- if (!empty($URI_PARTS["pass"]))
294- $this->pass = $URI_PARTS["pass"];
295- if (empty($URI_PARTS["query"]))
296- $URI_PARTS["query"] = '';
297- if (empty($URI_PARTS["path"]))
298- $URI_PARTS["path"] = '';
299-
300- switch(strtolower($URI_PARTS["scheme"]))
301- {
302- case "http":
303- $this->host = $URI_PARTS["host"];
304- if(!empty($URI_PARTS["port"])) {
305- $this->port = $URI_PARTS["port"];
306- $this->host_port = $URI_PARTS["port"];
307- }
308- if($this->_connect($fp))
309- {
310- if($this->_isproxy)
311- {
312- // using proxy, send entire URI
313- $this->_httprequest($URI,$fp,$URI,$this->_submit_method,$this->_submit_type,$postdata);
314- }
315- else
316- {
317- $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
318- // no proxy, send only the path
319- $this->_httprequest($path, $fp, $URI, $this->_submit_method, $this->_submit_type, $postdata);
320- }
321-
322- $this->_disconnect($fp);
323-
324- if($this->_redirectaddr)
325- {
326- /* url was redirected, check if we've hit the max depth */
327- if($this->maxredirs > $this->_redirectdepth)
328- {
329- if(!preg_match("|^".$URI_PARTS["scheme"]."://|", $this->_redirectaddr))
330- $this->_redirectaddr = $this->_expandlinks($this->_redirectaddr,$URI_PARTS["scheme"]."://".$URI_PARTS["host"]);
331-
332- // only follow redirect if it's on this site, or offsiteok is true
333- if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
334- {
335- /* follow the redirect */
336- $this->_redirectdepth++;
337- $this->lastredirectaddr=$this->_redirectaddr;
338- if( strpos( $this->_redirectaddr, "?" ) > 0 )
339- $this->fetch($this->_redirectaddr); // the redirect has changed the request method from post to get
340- else
341- $this->submit($this->_redirectaddr,$formvars, $formfiles);
342- }
343- }
344- }
345-
346- if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
347- {
348- $frameurls = $this->_frameurls;
349- $this->_frameurls = array();
350-
351- while(list(,$frameurl) = each($frameurls))
352- {
353- if($this->_framedepth < $this->maxframes)
354- {
355- $this->fetch($frameurl);
356- $this->_framedepth++;
357- }
358- else
359- break;
360- }
361- }
362-
363- }
364- else
365- {
366- return false;
367- }
368- return true;
369- break;
370- case "https":
371- if(!$this->curl_path)
372- return false;
373- if(function_exists("is_executable"))
374- if (!is_executable($this->curl_path))
375- return false;
376- $this->host = $URI_PARTS["host"];
377- if(!empty($URI_PARTS["port"])) {
378- $this->port = $URI_PARTS["port"];
379- $this->host_port = $URI_PARTS["port"];
380- }
381- if($this->_isproxy)
382- {
383- // using proxy, send entire URI
384- $this->_httpsrequest($URI, $URI, $this->_submit_method, $this->_submit_type, $postdata);
385- }
386- else
387- {
388- $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
389- // no proxy, send only the path
390- $this->_httpsrequest($path, $URI, $this->_submit_method, $this->_submit_type, $postdata);
391- }
392-
393- if($this->_redirectaddr)
394- {
395- /* url was redirected, check if we've hit the max depth */
396- if($this->maxredirs > $this->_redirectdepth)
397- {
398- if(!preg_match("|^".$URI_PARTS["scheme"]."://|", $this->_redirectaddr))
399- $this->_redirectaddr = $this->_expandlinks($this->_redirectaddr,$URI_PARTS["scheme"]."://".$URI_PARTS["host"]);
400-
401- // only follow redirect if it's on this site, or offsiteok is true
402- if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
403- {
404- /* follow the redirect */
405- $this->_redirectdepth++;
406- $this->lastredirectaddr=$this->_redirectaddr;
407- if( strpos( $this->_redirectaddr, "?" ) > 0 )
408- $this->fetch($this->_redirectaddr); // the redirect has changed the request method from post to get
409- else
410- $this->submit($this->_redirectaddr,$formvars, $formfiles);
411- }
412- }
413- }
414-
415- if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
416- {
417- $frameurls = $this->_frameurls;
418- $this->_frameurls = array();
419-
420- while(list(,$frameurl) = each($frameurls))
421- {
422- if($this->_framedepth < $this->maxframes)
423- {
424- $this->fetch($frameurl);
425- $this->_framedepth++;
426- }
427- else
428- break;
429- }
430- }
431- return true;
432- break;
433-
434- default:
435- // not a valid protocol
436- $this->error = 'Invalid protocol "'.$URI_PARTS["scheme"].'"\n';
437- return false;
438- break;
439- }
440- return true;
441- }
442-
443-/*======================================================================*\
444- Function: fetchlinks
445- Purpose: fetch the links from a web page
446- Input: $URI where you are fetching from
447- Output: $this->results an array of the URLs
448-\*======================================================================*/
449-
450- function fetchlinks($URI)
451- {
452- if ($this->fetch($URI))
453- {
454- if($this->lastredirectaddr)
455- $URI = $this->lastredirectaddr;
456- if(is_array($this->results))
457- {
458- for($x=0;$x<count($this->results);$x++)
459- $this->results[$x] = $this->_striplinks($this->results[$x]);
460- }
461- else
462- $this->results = $this->_striplinks($this->results);
463-
464- if($this->expandlinks)
465- $this->results = $this->_expandlinks($this->results, $URI);
466- return true;
467- }
468- else
469- return false;
470- }
471-
472-/*======================================================================*\
473- Function: fetchform
474- Purpose: fetch the form elements from a web page
475- Input: $URI where you are fetching from
476- Output: $this->results the resulting html form
477-\*======================================================================*/
478-
479- function fetchform($URI)
480- {
481-
482- if ($this->fetch($URI))
483- {
484-
485- if(is_array($this->results))
486- {
487- for($x=0;$x<count($this->results);$x++)
488- $this->results[$x] = $this->_stripform($this->results[$x]);
489- }
490- else
491- $this->results = $this->_stripform($this->results);
492-
493- return true;
494- }
495- else
496- return false;
497- }
498-
499-
500-/*======================================================================*\
501- Function: fetchtext
502- Purpose: fetch the text from a web page, stripping the links
503- Input: $URI where you are fetching from
504- Output: $this->results the text from the web page
505-\*======================================================================*/
506-
507- function fetchtext($URI)
508- {
509- if($this->fetch($URI))
510- {
511- if(is_array($this->results))
512- {
513- for($x=0;$x<count($this->results);$x++)
514- $this->results[$x] = $this->_striptext($this->results[$x]);
515- }
516- else
517- $this->results = $this->_striptext($this->results);
518- return true;
519- }
520- else
521- return false;
522- }
523-
524-/*======================================================================*\
525- Function: submitlinks
526- Purpose: grab links from a form submission
527- Input: $URI where you are submitting from
528- Output: $this->results an array of the links from the post
529-\*======================================================================*/
530-
531- function submitlinks($URI, $formvars="", $formfiles="")
532- {
533- if($this->submit($URI,$formvars, $formfiles))
534- {
535- if($this->lastredirectaddr)
536- $URI = $this->lastredirectaddr;
537- if(is_array($this->results))
538- {
539- for($x=0;$x<count($this->results);$x++)
540- {
541- $this->results[$x] = $this->_striplinks($this->results[$x]);
542- if($this->expandlinks)
543- $this->results[$x] = $this->_expandlinks($this->results[$x],$URI);
544- }
545- }
546- else
547- {
548- $this->results = $this->_striplinks($this->results);
549- if($this->expandlinks)
550- $this->results = $this->_expandlinks($this->results,$URI);
551- }
552- return true;
553- }
554- else
555- return false;
556- }
557-
558-/*======================================================================*\
559- Function: submittext
560- Purpose: grab text from a form submission
561- Input: $URI where you are submitting from
562- Output: $this->results the text from the web page
563-\*======================================================================*/
564-
565- function submittext($URI, $formvars = "", $formfiles = "")
566- {
567- if($this->submit($URI,$formvars, $formfiles))
568- {
569- if($this->lastredirectaddr)
570- $URI = $this->lastredirectaddr;
571- if(is_array($this->results))
572- {
573- for($x=0;$x<count($this->results);$x++)
574- {
575- $this->results[$x] = $this->_striptext($this->results[$x]);
576- if($this->expandlinks)
577- $this->results[$x] = $this->_expandlinks($this->results[$x],$URI);
578- }
579- }
580- else
581- {
582- $this->results = $this->_striptext($this->results);
583- if($this->expandlinks)
584- $this->results = $this->_expandlinks($this->results,$URI);
585- }
586- return true;
587- }
588- else
589- return false;
590- }
591-
592-
593-
594-/*======================================================================*\
595- Function: set_submit_multipart
596- Purpose: Set the form submission content type to
597- multipart/form-data
598-\*======================================================================*/
599- function set_submit_multipart()
600- {
601- $this->_submit_type = "multipart/form-data";
602- }
603-
604-
605-/*======================================================================*\
606- Function: set_submit_normal
607- Purpose: Set the form submission content type to
608- application/x-www-form-urlencoded
609-\*======================================================================*/
610- function set_submit_normal()
611- {
612- $this->_submit_type = "application/x-www-form-urlencoded";
613- }
614-
615-
616-// XOOPS2 Hack begin
617-// Added on March 4, 2003 by onokazu@xoops.org
618-/*======================================================================*\
619- Function: set_submit_xml
620- Purpose: Set the submission content type to
621- text/xml
622-\*======================================================================*/
623- function set_submit_xml()
624- {
625- $this->_submit_type = "text/xml";
626- }
627-// XOOPS2 Hack end
628-
629-
630-/*======================================================================*\
631- Private functions
632-\*======================================================================*/
633-
634-
635-/*======================================================================*\
636- Function: _striplinks
637- Purpose: strip the hyperlinks from an html document
638- Input: $document document to strip.
639- Output: $match an array of the links
640-\*======================================================================*/
641-
642- function _striplinks($document)
643- {
644- preg_match_all("'<\s*a\s.*?href\s*=\s* # find <a href=
645- ([\"\'])? # find single or double quote
646- (?(1) (.*?)\\1 | ([^\s\>]+)) # if quote found, match up to next matching
647- # quote, otherwise match up to next space
648- 'isx",$document,$links);
649-
650-
651- // catenate the non-empty matches from the conditional subpattern
652-
653- while(list($key,$val) = each($links[2]))
654- {
655- if(!empty($val))
656- $match[] = $val;
657- }
658-
659- while(list($key,$val) = each($links[3]))
660- {
661- if(!empty($val))
662- $match[] = $val;
663- }
664-
665- // return the links
666- return $match;
667- }
668-
669-/*======================================================================*\
670- Function: _stripform
671- Purpose: strip the form elements from an html document
672- Input: $document document to strip.
673- Output: $match an array of the links
674-\*======================================================================*/
675-
676- function _stripform($document)
677- {
678- preg_match_all("'<\/?(FORM|INPUT|SELECT|TEXTAREA|(OPTION))[^<>]*>(?(2)(.*(?=<\/?(option|select)[^<>]*>[\r\n]*)|(?=[\r\n]*))|(?=[\r\n]*))'Usi",$document,$elements);
679-
680- // catenate the matches
681- $match = implode("\r\n",$elements[0]);
682-
683- // return the links
684- return $match;
685- }
686-
687-
688-
689-/*======================================================================*\
690- Function: _striptext
691- Purpose: strip the text from an html document
692- Input: $document document to strip.
693- Output: $text the resulting text
694-\*======================================================================*/
695-
696- function _striptext($document)
697- {
698-
699- // I didn't use preg eval (//e) since that is only available in PHP 4.0.
700- // so, list your entities one by one here. I included some of the
701- // more common ones.
702-
703- $search = array("'<script[^>]*?>.*?</script>'si", // strip out javascript
704- "'<[\/\!]*?[^<>]*?>'si", // strip out html tags
705- "'([\r\n])[\s]+'", // strip out white space
706- "'&(quot|#34|#034|#x22);'i", // replace html entities
707- "'&(amp|#38|#038|#x26);'i", // added hexadecimal values
708- "'&(lt|#60|#060|#x3c);'i",
709- "'&(gt|#62|#062|#x3e);'i",
710- "'&(nbsp|#160|#xa0);'i",
711- "'&(iexcl|#161);'i",
712- "'&(cent|#162);'i",
713- "'&(pound|#163);'i",
714- "'&(copy|#169);'i",
715- "'&(reg|#174);'i",
716- "'&(deg|#176);'i",
717- "'&(#39|#039|#x27);'",
718- "'&(euro|#8364);'i", // europe
719- "'&a(uml|UML);'", // german
720- "'&o(uml|UML);'",
721- "'&u(uml|UML);'",
722- "'&A(uml|UML);'",
723- "'&O(uml|UML);'",
724- "'&U(uml|UML);'",
725- "'&szlig;'i",
726- );
727- $replace = array( "",
728- "",
729- "\\1",
730- "\"",
731- "&",
732- "<",
733- ">",
734- " ",
735- chr(161),
736- chr(162),
737- chr(163),
738- chr(169),
739- chr(174),
740- chr(176),
741- chr(39),
742- chr(128),
743- chr(228),
744- chr(246),
745- chr(252),
746- chr(196),
747- chr(214),
748- chr(220),
749- chr(223),
750- );
751-
752- $text = preg_replace($search,$replace,$document);
753-
754- return $text;
755- }
756-
757-/*======================================================================*\
758- Function: _expandlinks
759- Purpose: expand each link into a fully qualified URL
760- Input: $links the links to qualify
761- $URI the full URI to get the base from
762- Output: $expandedLinks the expanded links
763-\*======================================================================*/
764-
765- function _expandlinks($links,$URI)
766- {
767-
768- preg_match("/^[^\?]+/",$URI,$match);
769-
770- $match = preg_replace("|/[^\/\.]+\.[^\/\.]+$|","",$match[0]);
771- $match = preg_replace("|/$|","",$match);
772- $match_part = parse_url($match);
773- $match_root =
774- $match_part["scheme"]."://".$match_part["host"];
775-
776- $search = array( "|^http://".preg_quote($this->host)."|i",
777- "|^(\/)|i",
778- "|^(?!http://)(?!mailto:)|i",
779- "|/\./|",
780- "|/[^\/]+/\.\./|"
781- );
782-
783- $replace = array( "",
784- $match_root."/",
785- $match."/",
786- "/",
787- "/"
788- );
789-
790- $expandedLinks = preg_replace($search,$replace,$links);
791-
792- return $expandedLinks;
793- }
794-
795-/*======================================================================*\
796- Function: _httprequest
797- Purpose: go get the http data from the server
798- Input: $url the url to fetch
799- $fp the current open file pointer
800- $URI the full URI
801- $body body contents to send if any (POST)
802- Output:
803-\*======================================================================*/
804-
805- function _httprequest($url,$fp,$URI,$http_method,$content_type="",$body="")
806- {
807- $cookie_headers = '';
808- if($this->passcookies && $this->_redirectaddr)
809- $this->setcookies();
810-
811- $URI_PARTS = parse_url($URI);
812- if(empty($url))
813- $url = "/";
814- $headers = $http_method." ".$url." ".$this->_httpversion."\r\n";
815- if(!empty($this->agent))
816- $headers .= "User-Agent: ".$this->agent."\r\n";
817- if(!empty($this->host) && !isset($this->rawheaders['Host'])) {
818- $headers .= "Host: ".$this->host;
819- if(!empty($this->host_port))
820- $headers .= ":".$this->host_port;
821- $headers .= "\r\n";
822- }
823- if(!empty($this->accept))
824- $headers .= "Accept: ".$this->accept."\r\n";
825- if(!empty($this->referer))
826- $headers .= "Referer: ".$this->referer."\r\n";
827- if(!empty($this->cookies))
828- {
829- if(!is_array($this->cookies))
830- $this->cookies = (array)$this->cookies;
831-
832- reset($this->cookies);
833- if ( count($this->cookies) > 0 ) {
834- $cookie_headers .= 'Cookie: ';
835- foreach ( $this->cookies as $cookieKey => $cookieVal ) {
836- $cookie_headers .= $cookieKey."=".urlencode($cookieVal)."; ";
837- }
838- $headers .= substr($cookie_headers,0,-2) . "\r\n";
839- }
840- }
841- if(!empty($this->rawheaders))
842- {
843- if(!is_array($this->rawheaders))
844- $this->rawheaders = (array)$this->rawheaders;
845- while(list($headerKey,$headerVal) = each($this->rawheaders))
846- $headers .= $headerKey.": ".$headerVal."\r\n";
847- }
848- if(!empty($content_type)) {
849- $headers .= "Content-type: $content_type";
850- if ($content_type == "multipart/form-data")
851- $headers .= "; boundary=".$this->_mime_boundary;
852- $headers .= "\r\n";
853- }
854- if(!empty($body))
855- $headers .= "Content-length: ".strlen($body)."\r\n";
856- if(!empty($this->user) || !empty($this->pass))
857- $headers .= "Authorization: Basic ".base64_encode($this->user.":".$this->pass)."\r\n";
858-
859- //add proxy auth headers
860- if(!empty($this->proxy_user))
861- $headers .= 'Proxy-Authorization: ' . 'Basic ' . base64_encode($this->proxy_user . ':' . $this->proxy_pass)."\r\n";
862-
863-
864- $headers .= "\r\n";
865-
866- // set the read timeout if needed
867- if ($this->read_timeout > 0)
868- socket_set_timeout($fp, $this->read_timeout);
869- $this->timed_out = false;
870-
871- fwrite($fp,$headers.$body,strlen($headers.$body));
872-
873- $this->_redirectaddr = false;
874- unset($this->headers);
875-
876- while($currentHeader = fgets($fp,$this->_maxlinelen))
877- {
878- if ($this->read_timeout > 0 && $this->_check_timeout($fp))
879- {
880- $this->status=-100;
881- return false;
882- }
883-
884- if($currentHeader == "\r\n")
885- break;
886-
887- // if a header begins with Location: or URI:, set the redirect
888- if(preg_match("/^(Location:|URI:)/i",$currentHeader))
889- {
890- // get URL portion of the redirect
891- preg_match("/^(Location:|URI:)[ ]+(.*)/i",chop($currentHeader),$matches);
892- // look for :// in the Location header to see if hostname is included
893- if(!preg_match("|\:\/\/|",$matches[2]))
894- {
895- // no host in the path, so prepend
896- $this->_redirectaddr = $URI_PARTS["scheme"]."://".$this->host;
897- if(!empty($this->host_port))
898- $this->_redirectaddr .= ":".$this->host_port;
899- // eliminate double slash
900- if(!preg_match("|^/|",$matches[2]))
901- $this->_redirectaddr .= "/".$matches[2];
902- else
903- $this->_redirectaddr .= $matches[2];
904- }
905- else
906- $this->_redirectaddr = $matches[2];
907- }
908-
909- if(preg_match("|^HTTP/|",$currentHeader))
910- {
911- if(preg_match("|^HTTP/[^\s]*\s(.*?)\s|",$currentHeader, $status))
912- {
913- $this->status= $status[1];
914- }
915- $this->response_code = $currentHeader;
916- }
917-
918- $this->headers[] = $currentHeader;
919- }
920-
921- $results = '';
922- do {
923- $_data = fread($fp, $this->maxlength);
924- if (strlen($_data) == 0) {
925- break;
926- }
927- $results .= $_data;
928- } while(true);
929-
930- if ($this->read_timeout > 0 && $this->_check_timeout($fp))
931- {
932- $this->status=-100;
933- return false;
934- }
935-
936- // check if there is a a redirect meta tag
937-
938- if(preg_match("'<meta[\s]*http-equiv[^>]*?content[\s]*=[\s]*[\"\']?\d+;[\s]*URL[\s]*=[\s]*([^\"\']*?)[\"\']?>'i",$results,$match))
939-
940- {
941- $this->_redirectaddr = $this->_expandlinks($match[1],$URI);
942- }
943-
944- // have we hit our frame depth and is there frame src to fetch?
945- if(($this->_framedepth < $this->maxframes) && preg_match_all("'<frame\s+.*src[\s]*=[\'\"]?([^\'\"\>]+)'i",$results,$match))
946- {
947- $this->results[] = $results;
948- for($x=0; $x<count($match[1]); $x++)
949- $this->_frameurls[] = $this->_expandlinks($match[1][$x],$URI_PARTS["scheme"]."://".$this->host);
950- }
951- // have we already fetched framed content?
952- elseif(is_array($this->results))
953- $this->results[] = $results;
954- // no framed content
955- else
956- $this->results = $results;
957-
958- return true;
959- }
960-
961-/*======================================================================*\
962- Function: _httpsrequest
963- Purpose: go get the https data from the server using curl
964- Input: $url the url to fetch
965- $URI the full URI
966- $body body contents to send if any (POST)
967- Output:
968-\*======================================================================*/
969-
970- function _httpsrequest($url,$URI,$http_method,$content_type="",$body="")
971- {
972- if($this->passcookies && $this->_redirectaddr)
973- $this->setcookies();
974-
975- $headers = array();
976-
977- $URI_PARTS = parse_url($URI);
978- if(empty($url))
979- $url = "/";
980- // GET ... header not needed for curl
981- //$headers[] = $http_method." ".$url." ".$this->_httpversion;
982- if(!empty($this->agent))
983- $headers[] = "User-Agent: ".$this->agent;
984- if(!empty($this->host))
985- if(!empty($this->host_port))
986- $headers[] = "Host: ".$this->host.":".$this->host_port;
987- else
988- $headers[] = "Host: ".$this->host;
989- if(!empty($this->accept))
990- $headers[] = "Accept: ".$this->accept;
991- if(!empty($this->referer))
992- $headers[] = "Referer: ".$this->referer;
993- if(!empty($this->cookies))
994- {
995- if(!is_array($this->cookies))
996- $this->cookies = (array)$this->cookies;
997-
998- reset($this->cookies);
999- if ( count($this->cookies) > 0 ) {
1000- $cookie_str = 'Cookie: ';
1001- foreach ( $this->cookies as $cookieKey => $cookieVal ) {
1002- $cookie_str .= $cookieKey."=".urlencode($cookieVal)."; ";
1003- }
1004- $headers[] = substr($cookie_str,0,-2);
1005- }
1006- }
1007- if(!empty($this->rawheaders))
1008- {
1009- if(!is_array($this->rawheaders))
1010- $this->rawheaders = (array)$this->rawheaders;
1011- while(list($headerKey,$headerVal) = each($this->rawheaders))
1012- $headers[] = $headerKey.": ".$headerVal;
1013- }
1014- if(!empty($content_type)) {
1015- if ($content_type == "multipart/form-data")
1016- $headers[] = "Content-type: $content_type; boundary=".$this->_mime_boundary;
1017- else
1018- $headers[] = "Content-type: $content_type";
1019- }
1020- if(!empty($body))
1021- $headers[] = "Content-length: ".strlen($body);
1022- if(!empty($this->user) || !empty($this->pass))
1023- $headers[] = "Authorization: BASIC ".base64_encode($this->user.":".$this->pass);
1024-
1025- for($curr_header = 0; $curr_header < count($headers); $curr_header++) {
1026- $safer_header = strtr( $headers[$curr_header], "\"", " " );
1027- $cmdline_params .= " -H \"".$safer_header."\"";
1028- }
1029-
1030- if(!empty($body))
1031- $cmdline_params .= " -d \"$body\"";
1032-
1033- if($this->read_timeout > 0)
1034- $cmdline_params .= " -m ".$this->read_timeout;
1035-
1036- $headerfile = tempnam($temp_dir, "sno");
1037-
1038- exec($this->curl_path." -k -D \"$headerfile\"".$cmdline_params." \"".escapeshellcmd($URI)."\"",$results,$return);
1039-
1040- if($return)
1041- {
1042- $this->error = "Error: cURL could not retrieve the document, error $return.";
1043- return false;
1044- }
1045-
1046-
1047- $results = implode("\r\n",$results);
1048-
1049- $result_headers = file("$headerfile");
1050-
1051- $this->_redirectaddr = false;
1052- unset($this->headers);
1053-
1054- for($currentHeader = 0; $currentHeader < count($result_headers); $currentHeader++)
1055- {
1056-
1057- // if a header begins with Location: or URI:, set the redirect
1058- if(preg_match("/^(Location: |URI: )/i",$result_headers[$currentHeader]))
1059- {
1060- // get URL portion of the redirect
1061- preg_match("/^(Location: |URI:)\s+(.*)/",chop($result_headers[$currentHeader]),$matches);
1062- // look for :// in the Location header to see if hostname is included
1063- if(!preg_match("|\:\/\/|",$matches[2]))
1064- {
1065- // no host in the path, so prepend
1066- $this->_redirectaddr = $URI_PARTS["scheme"]."://".$this->host;
1067- if(!empty($this->host_port))
1068- $this->_redirectaddr .= ":".$this->host_port;
1069- // eliminate double slash
1070- if(!preg_match("|^/|",$matches[2]))
1071- $this->_redirectaddr .= "/".$matches[2];
1072- else
1073- $this->_redirectaddr .= $matches[2];
1074- }
1075- else
1076- $this->_redirectaddr = $matches[2];
1077- }
1078-
1079- if(preg_match("|^HTTP/|",$result_headers[$currentHeader]))
1080- $this->response_code = $result_headers[$currentHeader];
1081-
1082- $this->headers[] = $result_headers[$currentHeader];
1083- }
1084-
1085- // check if there is a a redirect meta tag
1086-
1087- if(preg_match("'<meta[\s]*http-equiv[^>]*?content[\s]*=[\s]*[\"\']?\d+;[\s]*URL[\s]*=[\s]*([^\"\']*?)[\"\']?>'i",$results,$match))
1088- {
1089- $this->_redirectaddr = $this->_expandlinks($match[1],$URI);
1090- }
1091-
1092- // have we hit our frame depth and is there frame src to fetch?
1093- if(($this->_framedepth < $this->maxframes) && preg_match_all("'<frame\s+.*src[\s]*=[\'\"]?([^\'\"\>]+)'i",$results,$match))
1094- {
1095- $this->results[] = $results;
1096- for($x=0; $x<count($match[1]); $x++)
1097- $this->_frameurls[] = $this->_expandlinks($match[1][$x],$URI_PARTS["scheme"]."://".$this->host);
1098- }
1099- // have we already fetched framed content?
1100- elseif(is_array($this->results))
1101- $this->results[] = $results;
1102- // no framed content
1103- else
1104- $this->results = $results;
1105-
1106- unlink("$headerfile");
1107-
1108- return true;
1109- }
1110-
1111-/*======================================================================*\
1112- Function: setcookies()
1113- Purpose: set cookies for a redirection
1114-\*======================================================================*/
1115-
1116- function setcookies()
1117- {
1118- for($x=0; $x<count($this->headers); $x++)
1119- {
1120- if(preg_match('/^set-cookie:[\s]+([^=]+)=([^;]+)/i', $this->headers[$x],$match))
1121- $this->cookies[$match[1]] = urldecode($match[2]);
1122- }
1123- }
1124-
1125-
1126-/*======================================================================*\
1127- Function: _check_timeout
1128- Purpose: checks whether timeout has occurred
1129- Input: $fp file pointer
1130-\*======================================================================*/
1131-
1132- function _check_timeout($fp)
1133- {
1134- if ($this->read_timeout > 0) {
1135- $fp_status = socket_get_status($fp);
1136- if ($fp_status["timed_out"]) {
1137- $this->timed_out = true;
1138- return true;
1139- }
1140- }
1141- return false;
1142- }
1143-
1144-/*======================================================================*\
1145- Function: _connect
1146- Purpose: make a socket connection
1147- Input: $fp file pointer
1148-\*======================================================================*/
1149-
1150- function _connect(&$fp)
1151- {
1152- if(!empty($this->proxy_host) && !empty($this->proxy_port))
1153- {
1154- $this->_isproxy = true;
1155-
1156- $host = $this->proxy_host;
1157- $port = $this->proxy_port;
1158- }
1159- else
1160- {
1161- $host = $this->host;
1162- $port = $this->port;
1163- }
1164-
1165- $this->status = 0;
1166-
1167- if($fp = fsockopen(
1168- $host,
1169- $port,
1170- $errno,
1171- $errstr,
1172- $this->_fp_timeout
1173- ))
1174- {
1175- // socket connection succeeded
1176-
1177- return true;
1178- }
1179- else
1180- {
1181- // socket connection failed
1182- $this->status = $errno;
1183- switch($errno)
1184- {
1185- case -3:
1186- $this->error="socket creation failed (-3)";
1187- case -4:
1188- $this->error="dns lookup failure (-4)";
1189- case -5:
1190- $this->error="connection refused or timed out (-5)";
1191- default:
1192- $this->error="connection failed (".$errno.")";
1193- }
1194- return false;
1195- }
1196- }
1197-/*======================================================================*\
1198- Function: _disconnect
1199- Purpose: disconnect a socket connection
1200- Input: $fp file pointer
1201-\*======================================================================*/
1202-
1203- function _disconnect($fp)
1204- {
1205- return(fclose($fp));
1206- }
1207-
1208-
1209-/*======================================================================*\
1210- Function: _prepare_post_body
1211- Purpose: Prepare post body according to encoding type
1212- Input: $formvars - form variables
1213- $formfiles - form upload files
1214- Output: post body
1215-\*======================================================================*/
1216-
1217- function _prepare_post_body($formvars, $formfiles)
1218- {
1219- settype($formvars, "array");
1220- settype($formfiles, "array");
1221- $postdata = '';
1222-
1223- if (count($formvars) == 0 && count($formfiles) == 0)
1224- return;
1225-
1226- switch ($this->_submit_type) {
1227- case "application/x-www-form-urlencoded":
1228- reset($formvars);
1229- while(list($key,$val) = each($formvars)) {
1230- if (is_array($val) || is_object($val)) {
1231- while (list($cur_key, $cur_val) = each($val)) {
1232- $postdata .= urlencode($key)."[]=".urlencode($cur_val)."&";
1233- }
1234- } else
1235- $postdata .= urlencode($key)."=".urlencode($val)."&";
1236- }
1237- break;
1238-
1239- case "multipart/form-data":
1240- $this->_mime_boundary = "Snoopy".md5(uniqid(microtime()));
1241-
1242- reset($formvars);
1243- while(list($key,$val) = each($formvars)) {
1244- if (is_array($val) || is_object($val)) {
1245- while (list($cur_key, $cur_val) = each($val)) {
1246- $postdata .= "--".$this->_mime_boundary."\r\n";
1247- $postdata .= "Content-Disposition: form-data; name=\"$key\[\]\"\r\n\r\n";
1248- $postdata .= "$cur_val\r\n";
1249- }
1250- } else {
1251- $postdata .= "--".$this->_mime_boundary."\r\n";
1252- $postdata .= "Content-Disposition: form-data; name=\"$key\"\r\n\r\n";
1253- $postdata .= "$val\r\n";
1254- }
1255- }
1256-
1257- reset($formfiles);
1258- while (list($field_name, $file_names) = each($formfiles)) {
1259- settype($file_names, "array");
1260- while (list(, $file_name) = each($file_names)) {
1261- if (!is_readable($file_name)) continue;
1262-
1263- $fp = fopen($file_name, "r");
1264- $file_content = fread($fp, filesize($file_name));
1265- fclose($fp);
1266- $base_name = basename($file_name);
1267-
1268- $postdata .= "--".$this->_mime_boundary."\r\n";
1269- $postdata .= "Content-Disposition: form-data; name=\"$field_name\"; filename=\"$base_name\"\r\n\r\n";
1270- $postdata .= "$file_content\r\n";
1271- }
1272- }
1273- $postdata .= "--".$this->_mime_boundary."--\r\n";
1274- break;
1275- // XOOPS2 Hack begin
1276- // Added on March 4, 2003 by onokazu@xoops.org
1277- case "text/xml":
1278- default:
1279- $postdata = $formvars[0];
1280- break;
1281- // XOOPS2 Hack end
1282- }
1283-
1284- return $postdata;
1285- }
1286-}
1287-
1288-?>
1+<?php
2+
3+/*************************************************
4+
5+Snoopy - the PHP net client
6+Author: Monte Ohrt <monte@ispi.net>
7+Copyright (c): 1999-2008 New Digital Group, all rights reserved
8+Version: 1.2.4
9+
10+ * This library is free software; you can redistribute it and/or
11+ * modify it under the terms of the GNU Lesser General Public
12+ * License as published by the Free Software Foundation; either
13+ * version 2.1 of the License, or (at your option) any later version.
14+ *
15+ * This library is distributed in the hope that it will be useful,
16+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
17+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18+ * Lesser General Public License for more details.
19+ *
20+ * You should have received a copy of the GNU Lesser General Public
21+ * License along with this library; if not, write to the Free Software
22+ * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23+
24+You may contact the author of Snoopy by e-mail at:
25+monte@ohrt.com
26+
27+The latest version of Snoopy can be obtained from:
28+http://snoopy.sourceforge.net/
29+
30+*************************************************/
31+
32+class Snoopy
33+{
34+ /**** Public variables ****/
35+
36+ /* user definable vars */
37+
38+ var $host = "www.php.net"; // host name we are connecting to
39+ var $port = 80; // port we are connecting to
40+ var $proxy_host = ""; // proxy host to use
41+ var $proxy_port = ""; // proxy port to use
42+ var $proxy_user = ""; // proxy user to use
43+ var $proxy_pass = ""; // proxy password to use
44+
45+ var $agent = "Snoopy v1.2.4"; // agent we masquerade as
46+ var $referer = ""; // referer info to pass
47+ var $cookies = array(); // array of cookies to pass
48+ // $cookies["username"]="joe";
49+ var $rawheaders = array(); // array of raw headers to send
50+ // $rawheaders["Content-type"]="text/html";
51+
52+ var $maxredirs = 5; // http redirection depth maximum. 0 = disallow
53+ var $lastredirectaddr = ""; // contains address of last redirected address
54+ var $offsiteok = true; // allows redirection off-site
55+ var $maxframes = 0; // frame content depth maximum. 0 = disallow
56+ var $expandlinks = true; // expand links to fully qualified URLs.
57+ // this only applies to fetchlinks()
58+ // submitlinks(), and submittext()
59+ var $passcookies = true; // pass set cookies back through redirects
60+ // NOTE: this currently does not respect
61+ // dates, domains or paths.
62+
63+ var $user = ""; // user for http authentication
64+ var $pass = ""; // password for http authentication
65+
66+ // http accept types
67+ var $accept = "image/gif, image/x-xbitmap, image/jpeg, image/pjpeg, */*";
68+
69+ var $results = ""; // where the content is put
70+
71+ var $error = ""; // error messages sent here
72+ var $response_code = ""; // response code returned from server
73+ var $headers = array(); // headers returned from server sent here
74+ var $maxlength = 500000; // max return data length (body)
75+ var $read_timeout = 0; // timeout on read operations, in seconds
76+ // supported only since PHP 4 Beta 4
77+ // set to 0 to disallow timeouts
78+ var $timed_out = false; // if a read operation timed out
79+ var $status = 0; // http request status
80+
81+ var $temp_dir = "/tmp"; // temporary directory that the webserver
82+ // has permission to write to.
83+ // under Windows, this should be C:\temp
84+
85+ var $curl_path = "/usr/local/bin/curl";
86+ // Snoopy will use cURL for fetching
87+ // SSL content if a full system path to
88+ // the cURL binary is supplied here.
89+ // set to false if you do not have
90+ // cURL installed. See http://curl.haxx.se
91+ // for details on installing cURL.
92+ // Snoopy does *not* use the cURL
93+ // library functions built into php,
94+ // as these functions are not stable
95+ // as of this Snoopy release.
96+
97+ /**** Private variables ****/
98+
99+ var $_maxlinelen = 4096; // max line length (headers)
100+
101+ var $_httpmethod = "GET"; // default http request method
102+ var $_httpversion = "HTTP/1.0"; // default http request version
103+ var $_submit_method = "POST"; // default submit method
104+ var $_submit_type = "application/x-www-form-urlencoded"; // default submit type
105+ var $_mime_boundary = ""; // MIME boundary for multipart/form-data submit type
106+ var $_redirectaddr = false; // will be set if page fetched is a redirect
107+ var $_redirectdepth = 0; // increments on an http redirect
108+ var $_frameurls = array(); // frame src urls
109+ var $_framedepth = 0; // increments on frame depth
110+
111+ var $_isproxy = false; // set if using a proxy server
112+ var $_fp_timeout = 30; // timeout for socket connection
113+
114+/*======================================================================*\
115+ Function: fetch
116+ Purpose: fetch the contents of a web page
117+ (and possibly other protocols in the
118+ future like ftp, nntp, gopher, etc.)
119+ Input: $URI the location of the page to fetch
120+ Output: $this->results the output text from the fetch
121+\*======================================================================*/
122+
123+ function fetch($URI)
124+ {
125+
126+ //preg_match("|^([^:]+)://([^:/]+)(:[\d]+)*(.*)|",$URI,$URI_PARTS);
127+ $URI_PARTS = parse_url($URI);
128+ if (!empty($URI_PARTS["user"]))
129+ $this->user = $URI_PARTS["user"];
130+ if (!empty($URI_PARTS["pass"]))
131+ $this->pass = $URI_PARTS["pass"];
132+ if (empty($URI_PARTS["query"]))
133+ $URI_PARTS["query"] = '';
134+ if (empty($URI_PARTS["path"]))
135+ $URI_PARTS["path"] = '';
136+
137+ switch(strtolower($URI_PARTS["scheme"]))
138+ {
139+ case "http":
140+ $this->host = $URI_PARTS["host"];
141+ if(!empty($URI_PARTS["port"]))
142+ $this->port = $URI_PARTS["port"];
143+ if($this->_connect($fp))
144+ {
145+ if($this->_isproxy)
146+ {
147+ // using proxy, send entire URI
148+ $this->_httprequest($URI,$fp,$URI,$this->_httpmethod);
149+ }
150+ else
151+ {
152+ $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
153+ // no proxy, send only the path
154+ $this->_httprequest($path, $fp, $URI, $this->_httpmethod);
155+ }
156+
157+ $this->_disconnect($fp);
158+
159+ if($this->_redirectaddr)
160+ {
161+ /* url was redirected, check if we've hit the max depth */
162+ if($this->maxredirs > $this->_redirectdepth)
163+ {
164+ // only follow redirect if it's on this site, or offsiteok is true
165+ if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
166+ {
167+ /* follow the redirect */
168+ $this->_redirectdepth++;
169+ $this->lastredirectaddr=$this->_redirectaddr;
170+ $this->fetch($this->_redirectaddr);
171+ }
172+ }
173+ }
174+
175+ if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
176+ {
177+ $frameurls = $this->_frameurls;
178+ $this->_frameurls = array();
179+
180+ while(list(,$frameurl) = each($frameurls))
181+ {
182+ if($this->_framedepth < $this->maxframes)
183+ {
184+ $this->fetch($frameurl);
185+ $this->_framedepth++;
186+ }
187+ else
188+ break;
189+ }
190+ }
191+ }
192+ else
193+ {
194+ return false;
195+ }
196+ return true;
197+ break;
198+ case "https":
199+ if(!$this->curl_path)
200+ return false;
201+ if(function_exists("is_executable"))
202+ if (!is_executable($this->curl_path))
203+ return false;
204+ $this->host = $URI_PARTS["host"];
205+ if(!empty($URI_PARTS["port"]))
206+ $this->port = $URI_PARTS["port"];
207+ if($this->_isproxy)
208+ {
209+ // using proxy, send entire URI
210+ $this->_httpsrequest($URI,$URI,$this->_httpmethod);
211+ }
212+ else
213+ {
214+ $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
215+ // no proxy, send only the path
216+ $this->_httpsrequest($path, $URI, $this->_httpmethod);
217+ }
218+
219+ if($this->_redirectaddr)
220+ {
221+ /* url was redirected, check if we've hit the max depth */
222+ if($this->maxredirs > $this->_redirectdepth)
223+ {
224+ // only follow redirect if it's on this site, or offsiteok is true
225+ if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
226+ {
227+ /* follow the redirect */
228+ $this->_redirectdepth++;
229+ $this->lastredirectaddr=$this->_redirectaddr;
230+ $this->fetch($this->_redirectaddr);
231+ }
232+ }
233+ }
234+
235+ if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
236+ {
237+ $frameurls = $this->_frameurls;
238+ $this->_frameurls = array();
239+
240+ while(list(,$frameurl) = each($frameurls))
241+ {
242+ if($this->_framedepth < $this->maxframes)
243+ {
244+ $this->fetch($frameurl);
245+ $this->_framedepth++;
246+ }
247+ else
248+ break;
249+ }
250+ }
251+ return true;
252+ break;
253+ default:
254+ // not a valid protocol
255+ $this->error = 'Invalid protocol "'.$URI_PARTS["scheme"].'"\n';
256+ return false;
257+ break;
258+ }
259+ return true;
260+ }
261+
262+/*======================================================================*\
263+ Function: submit
264+ Purpose: submit an http form
265+ Input: $URI the location to post the data
266+ $formvars the formvars to use.
267+ format: $formvars["var"] = "val";
268+ $formfiles an array of files to submit
269+ format: $formfiles["var"] = "/dir/filename.ext";
270+ Output: $this->results the text output from the post
271+\*======================================================================*/
272+
273+ function submit($URI, $formvars="", $formfiles="")
274+ {
275+ unset($postdata);
276+
277+ $postdata = $this->_prepare_post_body($formvars, $formfiles);
278+
279+ $URI_PARTS = parse_url($URI);
280+ if (!empty($URI_PARTS["user"]))
281+ $this->user = $URI_PARTS["user"];
282+ if (!empty($URI_PARTS["pass"]))
283+ $this->pass = $URI_PARTS["pass"];
284+ if (empty($URI_PARTS["query"]))
285+ $URI_PARTS["query"] = '';
286+ if (empty($URI_PARTS["path"]))
287+ $URI_PARTS["path"] = '';
288+
289+ switch(strtolower($URI_PARTS["scheme"]))
290+ {
291+ case "http":
292+ $this->host = $URI_PARTS["host"];
293+ if(!empty($URI_PARTS["port"]))
294+ $this->port = $URI_PARTS["port"];
295+ if($this->_connect($fp))
296+ {
297+ if($this->_isproxy)
298+ {
299+ // using proxy, send entire URI
300+ $this->_httprequest($URI,$fp,$URI,$this->_submit_method,$this->_submit_type,$postdata);
301+ }
302+ else
303+ {
304+ $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
305+ // no proxy, send only the path
306+ $this->_httprequest($path, $fp, $URI, $this->_submit_method, $this->_submit_type, $postdata);
307+ }
308+
309+ $this->_disconnect($fp);
310+
311+ if($this->_redirectaddr)
312+ {
313+ /* url was redirected, check if we've hit the max depth */
314+ if($this->maxredirs > $this->_redirectdepth)
315+ {
316+ if(!preg_match("|^".$URI_PARTS["scheme"]."://|", $this->_redirectaddr))
317+ $this->_redirectaddr = $this->_expandlinks($this->_redirectaddr,$URI_PARTS["scheme"]."://".$URI_PARTS["host"]);
318+
319+ // only follow redirect if it's on this site, or offsiteok is true
320+ if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
321+ {
322+ /* follow the redirect */
323+ $this->_redirectdepth++;
324+ $this->lastredirectaddr=$this->_redirectaddr;
325+ if( strpos( $this->_redirectaddr, "?" ) > 0 )
326+ $this->fetch($this->_redirectaddr); // the redirect has changed the request method from post to get
327+ else
328+ $this->submit($this->_redirectaddr,$formvars, $formfiles);
329+ }
330+ }
331+ }
332+
333+ if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
334+ {
335+ $frameurls = $this->_frameurls;
336+ $this->_frameurls = array();
337+
338+ while(list(,$frameurl) = each($frameurls))
339+ {
340+ if($this->_framedepth < $this->maxframes)
341+ {
342+ $this->fetch($frameurl);
343+ $this->_framedepth++;
344+ }
345+ else
346+ break;
347+ }
348+ }
349+
350+ }
351+ else
352+ {
353+ return false;
354+ }
355+ return true;
356+ break;
357+ case "https":
358+ if(!$this->curl_path)
359+ return false;
360+ if(function_exists("is_executable"))
361+ if (!is_executable($this->curl_path))
362+ return false;
363+ $this->host = $URI_PARTS["host"];
364+ if(!empty($URI_PARTS["port"]))
365+ $this->port = $URI_PARTS["port"];
366+ if($this->_isproxy)
367+ {
368+ // using proxy, send entire URI
369+ $this->_httpsrequest($URI, $URI, $this->_submit_method, $this->_submit_type, $postdata);
370+ }
371+ else
372+ {
373+ $path = $URI_PARTS["path"].($URI_PARTS["query"] ? "?".$URI_PARTS["query"] : "");
374+ // no proxy, send only the path
375+ $this->_httpsrequest($path, $URI, $this->_submit_method, $this->_submit_type, $postdata);
376+ }
377+
378+ if($this->_redirectaddr)
379+ {
380+ /* url was redirected, check if we've hit the max depth */
381+ if($this->maxredirs > $this->_redirectdepth)
382+ {
383+ if(!preg_match("|^".$URI_PARTS["scheme"]."://|", $this->_redirectaddr))
384+ $this->_redirectaddr = $this->_expandlinks($this->_redirectaddr,$URI_PARTS["scheme"]."://".$URI_PARTS["host"]);
385+
386+ // only follow redirect if it's on this site, or offsiteok is true
387+ if(preg_match("|^http://".preg_quote($this->host)."|i",$this->_redirectaddr) || $this->offsiteok)
388+ {
389+ /* follow the redirect */
390+ $this->_redirectdepth++;
391+ $this->lastredirectaddr=$this->_redirectaddr;
392+ if( strpos( $this->_redirectaddr, "?" ) > 0 )
393+ $this->fetch($this->_redirectaddr); // the redirect has changed the request method from post to get
394+ else
395+ $this->submit($this->_redirectaddr,$formvars, $formfiles);
396+ }
397+ }
398+ }
399+
400+ if($this->_framedepth < $this->maxframes && count($this->_frameurls) > 0)
401+ {
402+ $frameurls = $this->_frameurls;
403+ $this->_frameurls = array();
404+
405+ while(list(,$frameurl) = each($frameurls))
406+ {
407+ if($this->_framedepth < $this->maxframes)
408+ {
409+ $this->fetch($frameurl);
410+ $this->_framedepth++;
411+ }
412+ else
413+ break;
414+ }
415+ }
416+ return true;
417+ break;
418+
419+ default:
420+ // not a valid protocol
421+ $this->error = 'Invalid protocol "'.$URI_PARTS["scheme"].'"\n';
422+ return false;
423+ break;
424+ }
425+ return true;
426+ }
427+
428+/*======================================================================*\
429+ Function: fetchlinks
430+ Purpose: fetch the links from a web page
431+ Input: $URI where you are fetching from
432+ Output: $this->results an array of the URLs
433+\*======================================================================*/
434+
435+ function fetchlinks($URI)
436+ {
437+ if ($this->fetch($URI))
438+ {
439+ if($this->lastredirectaddr)
440+ $URI = $this->lastredirectaddr;
441+ if(is_array($this->results))
442+ {
443+ for($x=0;$x<count($this->results);$x++)
444+ $this->results[$x] = $this->_striplinks($this->results[$x]);
445+ }
446+ else
447+ $this->results = $this->_striplinks($this->results);
448+
449+ if($this->expandlinks)
450+ $this->results = $this->_expandlinks($this->results, $URI);
451+ return true;
452+ }
453+ else
454+ return false;
455+ }
456+
457+/*======================================================================*\
458+ Function: fetchform
459+ Purpose: fetch the form elements from a web page
460+ Input: $URI where you are fetching from
461+ Output: $this->results the resulting html form
462+\*======================================================================*/
463+
464+ function fetchform($URI)
465+ {
466+
467+ if ($this->fetch($URI))
468+ {
469+
470+ if(is_array($this->results))
471+ {
472+ for($x=0;$x<count($this->results);$x++)
473+ $this->results[$x] = $this->_stripform($this->results[$x]);
474+ }
475+ else
476+ $this->results = $this->_stripform($this->results);
477+
478+ return true;
479+ }
480+ else
481+ return false;
482+ }
483+
484+
485+/*======================================================================*\
486+ Function: fetchtext
487+ Purpose: fetch the text from a web page, stripping the links
488+ Input: $URI where you are fetching from
489+ Output: $this->results the text from the web page
490+\*======================================================================*/
491+
492+ function fetchtext($URI)
493+ {
494+ if($this->fetch($URI))
495+ {
496+ if(is_array($this->results))
497+ {
498+ for($x=0;$x<count($this->results);$x++)
499+ $this->results[$x] = $this->_striptext($this->results[$x]);
500+ }
501+ else
502+ $this->results = $this->_striptext($this->results);
503+ return true;
504+ }
505+ else
506+ return false;
507+ }
508+
509+/*======================================================================*\
510+ Function: submitlinks
511+ Purpose: grab links from a form submission
512+ Input: $URI where you are submitting from
513+ Output: $this->results an array of the links from the post
514+\*======================================================================*/
515+
516+ function submitlinks($URI, $formvars="", $formfiles="")
517+ {
518+ if($this->submit($URI,$formvars, $formfiles))
519+ {
520+ if($this->lastredirectaddr)
521+ $URI = $this->lastredirectaddr;
522+ if(is_array($this->results))
523+ {
524+ for($x=0;$x<count($this->results);$x++)
525+ {
526+ $this->results[$x] = $this->_striplinks($this->results[$x]);
527+ if($this->expandlinks)
528+ $this->results[$x] = $this->_expandlinks($this->results[$x],$URI);
529+ }
530+ }
531+ else
532+ {
533+ $this->results = $this->_striplinks($this->results);
534+ if($this->expandlinks)
535+ $this->results = $this->_expandlinks($this->results,$URI);
536+ }
537+ return true;
538+ }
539+ else
540+ return false;
541+ }
542+
543+/*======================================================================*\
544+ Function: submittext
545+ Purpose: grab text from a form submission
546+ Input: $URI where you are submitting from
547+ Output: $this->results the text from the web page
548+\*======================================================================*/
549+
550+ function submittext($URI, $formvars = "", $formfiles = "")
551+ {
552+ if($this->submit($URI,$formvars, $formfiles))
553+ {
554+ if($this->lastredirectaddr)
555+ $URI = $this->lastredirectaddr;
556+ if(is_array($this->results))
557+ {
558+ for($x=0;$x<count($this->results);$x++)
559+ {
560+ $this->results[$x] = $this->_striptext($this->results[$x]);
561+ if($this->expandlinks)
562+ $this->results[$x] = $this->_expandlinks($this->results[$x],$URI);
563+ }
564+ }
565+ else
566+ {
567+ $this->results = $this->_striptext($this->results);
568+ if($this->expandlinks)
569+ $this->results = $this->_expandlinks($this->results,$URI);
570+ }
571+ return true;
572+ }
573+ else
574+ return false;
575+ }
576+
577+
578+
579+/*======================================================================*\
580+ Function: set_submit_multipart
581+ Purpose: Set the form submission content type to
582+ multipart/form-data
583+\*======================================================================*/
584+ function set_submit_multipart()
585+ {
586+ $this->_submit_type = "multipart/form-data";
587+ }
588+
589+
590+/*======================================================================*\
591+ Function: set_submit_normal
592+ Purpose: Set the form submission content type to
593+ application/x-www-form-urlencoded
594+\*======================================================================*/
595+ function set_submit_normal()
596+ {
597+ $this->_submit_type = "application/x-www-form-urlencoded";
598+ }
599+
600+
601+
602+
603+/*======================================================================*\
604+ Private functions
605+\*======================================================================*/
606+
607+
608+/*======================================================================*\
609+ Function: _striplinks
610+ Purpose: strip the hyperlinks from an html document
611+ Input: $document document to strip.
612+ Output: $match an array of the links
613+\*======================================================================*/
614+
615+ function _striplinks($document)
616+ {
617+ preg_match_all("'<\s*a\s.*?href\s*=\s* # find <a href=
618+ ([\"\'])? # find single or double quote
619+ (?(1) (.*?)\\1 | ([^\s\>]+)) # if quote found, match up to next matching
620+ # quote, otherwise match up to next space
621+ 'isx",$document,$links);
622+
623+
624+ // catenate the non-empty matches from the conditional subpattern
625+
626+ while(list($key,$val) = each($links[2]))
627+ {
628+ if(!empty($val))
629+ $match[] = $val;
630+ }
631+
632+ while(list($key,$val) = each($links[3]))
633+ {
634+ if(!empty($val))
635+ $match[] = $val;
636+ }
637+
638+ // return the links
639+ return $match;
640+ }
641+
642+/*======================================================================*\
643+ Function: _stripform
644+ Purpose: strip the form elements from an html document
645+ Input: $document document to strip.
646+ Output: $match an array of the links
647+\*======================================================================*/
648+
649+ function _stripform($document)
650+ {
651+ preg_match_all("'<\/?(FORM|INPUT|SELECT|TEXTAREA|(OPTION))[^<>]*>(?(2)(.*(?=<\/?(option|select)[^<>]*>[\r\n]*)|(?=[\r\n]*))|(?=[\r\n]*))'Usi",$document,$elements);
652+
653+ // catenate the matches
654+ $match = implode("\r\n",$elements[0]);
655+
656+ // return the links
657+ return $match;
658+ }
659+
660+
661+
662+/*======================================================================*\
663+ Function: _striptext
664+ Purpose: strip the text from an html document
665+ Input: $document document to strip.
666+ Output: $text the resulting text
667+\*======================================================================*/
668+
669+ function _striptext($document)
670+ {
671+
672+ // I didn't use preg eval (//e) since that is only available in PHP 4.0.
673+ // so, list your entities one by one here. I included some of the
674+ // more common ones.
675+
676+ $search = array("'<script[^>]*?>.*?</script>'si", // strip out javascript
677+ "'<[\/\!]*?[^<>]*?>'si", // strip out html tags
678+ "'([\r\n])[\s]+'", // strip out white space
679+ "'&(quot|#34|#034|#x22);'i", // replace html entities
680+ "'&(amp|#38|#038|#x26);'i", // added hexadecimal values
681+ "'&(lt|#60|#060|#x3c);'i",
682+ "'&(gt|#62|#062|#x3e);'i",
683+ "'&(nbsp|#160|#xa0);'i",
684+ "'&(iexcl|#161);'i",
685+ "'&(cent|#162);'i",
686+ "'&(pound|#163);'i",
687+ "'&(copy|#169);'i",
688+ "'&(reg|#174);'i",
689+ "'&(deg|#176);'i",
690+ "'&(#39|#039|#x27);'",
691+ "'&(euro|#8364);'i", // europe
692+ "'&a(uml|UML);'", // german
693+ "'&o(uml|UML);'",
694+ "'&u(uml|UML);'",
695+ "'&A(uml|UML);'",
696+ "'&O(uml|UML);'",
697+ "'&U(uml|UML);'",
698+ "'&szlig;'i",
699+ );
700+ $replace = array( "",
701+ "",
702+ "\\1",
703+ "\"",
704+ "&",
705+ "<",
706+ ">",
707+ " ",
708+ chr(161),
709+ chr(162),
710+ chr(163),
711+ chr(169),
712+ chr(174),
713+ chr(176),
714+ chr(39),
715+ chr(128),
716+ /*
717+ * UTF8で表示出来ない文字をコードに変更
718+ * Marijuana
719+ */
720+ chr(228),
721+ chr(246),
722+ chr(252),
723+ chr(196),
724+ chr(214),
725+ chr(220),
726+ chr(223),
727+ );
728+
729+ $text = preg_replace($search,$replace,$document);
730+
731+ return $text;
732+ }
733+
734+/*======================================================================*\
735+ Function: _expandlinks
736+ Purpose: expand each link into a fully qualified URL
737+ Input: $links the links to qualify
738+ $URI the full URI to get the base from
739+ Output: $expandedLinks the expanded links
740+\*======================================================================*/
741+
742+ function _expandlinks($links,$URI)
743+ {
744+
745+ preg_match("/^[^\?]+/",$URI,$match);
746+
747+ $match = preg_replace("|/[^\/\.]+\.[^\/\.]+$|","",$match[0]);
748+ $match = preg_replace("|/$|","",$match);
749+ $match_part = parse_url($match);
750+ $match_root =
751+ $match_part["scheme"]."://".$match_part["host"];
752+
753+ $search = array( "|^http://".preg_quote($this->host)."|i",
754+ "|^(\/)|i",
755+ "|^(?!http://)(?!mailto:)|i",
756+ "|/\./|",
757+ "|/[^\/]+/\.\./|"
758+ );
759+
760+ $replace = array( "",
761+ $match_root."/",
762+ $match."/",
763+ "/",
764+ "/"
765+ );
766+
767+ $expandedLinks = preg_replace($search,$replace,$links);
768+
769+ return $expandedLinks;
770+ }
771+
772+/*======================================================================*\
773+ Function: _httprequest
774+ Purpose: go get the http data from the server
775+ Input: $url the url to fetch
776+ $fp the current open file pointer
777+ $URI the full URI
778+ $body body contents to send if any (POST)
779+ Output:
780+\*======================================================================*/
781+
782+ function _httprequest($url,$fp,$URI,$http_method,$content_type="",$body="")
783+ {
784+ $cookie_headers = '';
785+ if($this->passcookies && $this->_redirectaddr)
786+ $this->setcookies();
787+
788+ $URI_PARTS = parse_url($URI);
789+ if(empty($url))
790+ $url = "/";
791+ $headers = $http_method." ".$url." ".$this->_httpversion."\r\n";
792+ if(!empty($this->agent))
793+ $headers .= "User-Agent: ".$this->agent."\r\n";
794+ if(!empty($this->host) && !isset($this->rawheaders['Host'])) {
795+ $headers .= "Host: ".$this->host;
796+ /**
797+ * 80のときはポート番号を付けない
798+ * Marijuana
799+ */
800+ if(!empty($this->port) && $this->port != 80)
801+ $headers .= ":".$this->port;
802+ $headers .= "\r\n";
803+ }
804+ if(!empty($this->accept))
805+ $headers .= "Accept: ".$this->accept."\r\n";
806+ if(!empty($this->referer))
807+ $headers .= "Referer: ".$this->referer."\r\n";
808+ if(!empty($this->cookies))
809+ {
810+ if(!is_array($this->cookies))
811+ $this->cookies = (array)$this->cookies;
812+
813+ reset($this->cookies);
814+ if ( count($this->cookies) > 0 ) {
815+ $cookie_headers .= 'Cookie: ';
816+ foreach ( $this->cookies as $cookieKey => $cookieVal ) {
817+ $cookie_headers .= $cookieKey."=".urlencode($cookieVal)."; ";
818+ }
819+ $headers .= substr($cookie_headers,0,-2) . "\r\n";
820+ }
821+ }
822+ if(!empty($this->rawheaders))
823+ {
824+ if(!is_array($this->rawheaders))
825+ $this->rawheaders = (array)$this->rawheaders;
826+ while(list($headerKey,$headerVal) = each($this->rawheaders))
827+ $headers .= $headerKey.": ".$headerVal."\r\n";
828+ }
829+ if(!empty($content_type)) {
830+ $headers .= "Content-type: $content_type";
831+ if ($content_type == "multipart/form-data")
832+ $headers .= "; boundary=".$this->_mime_boundary;
833+ $headers .= "\r\n";
834+ }
835+ if(!empty($body))
836+ $headers .= "Content-length: ".strlen($body)."\r\n";
837+ if(!empty($this->user) || !empty($this->pass))
838+ $headers .= "Authorization: Basic ".base64_encode($this->user.":".$this->pass)."\r\n";
839+
840+ //add proxy auth headers
841+ if(!empty($this->proxy_user))
842+ $headers .= 'Proxy-Authorization: ' . 'Basic ' . base64_encode($this->proxy_user . ':' . $this->proxy_pass)."\r\n";
843+
844+
845+ $headers .= "\r\n";
846+
847+ // set the read timeout if needed
848+ if ($this->read_timeout > 0)
849+ socket_set_timeout($fp, $this->read_timeout);
850+ $this->timed_out = false;
851+
852+ fwrite($fp,$headers.$body,strlen($headers.$body));
853+
854+ $this->_redirectaddr = false;
855+ unset($this->headers);
856+
857+ while($currentHeader = fgets($fp,$this->_maxlinelen))
858+ {
859+ if ($this->read_timeout > 0 && $this->_check_timeout($fp))
860+ {
861+ $this->status=-100;
862+ return false;
863+ }
864+
865+ if($currentHeader == "\r\n")
866+ break;
867+
868+ // if a header begins with Location: or URI:, set the redirect
869+ if(preg_match("/^(Location:|URI:)/i",$currentHeader))
870+ {
871+ // get URL portion of the redirect
872+ preg_match("/^(Location:|URI:)[ ]+(.*)/i",chop($currentHeader),$matches);
873+ // look for :// in the Location header to see if hostname is included
874+ if(!preg_match("|\:\/\/|",$matches[2]))
875+ {
876+ // no host in the path, so prepend
877+ $this->_redirectaddr = $URI_PARTS["scheme"]."://".$this->host.":".$this->port;
878+ // eliminate double slash
879+ if(!preg_match("|^/|",$matches[2]))
880+ $this->_redirectaddr .= "/".$matches[2];
881+ else
882+ $this->_redirectaddr .= $matches[2];
883+ }
884+ else
885+ $this->_redirectaddr = $matches[2];
886+ }
887+
888+ if(preg_match("|^HTTP/|",$currentHeader))
889+ {
890+ if(preg_match("|^HTTP/[^\s]*\s(.*?)\s|",$currentHeader, $status))
891+ {
892+ $this->status= $status[1];
893+ }
894+ $this->response_code = $currentHeader;
895+ }
896+
897+ $this->headers[] = $currentHeader;
898+ }
899+
900+ $results = '';
901+ do {
902+ $_data = fread($fp, $this->maxlength);
903+ if (strlen($_data) == 0) {
904+ break;
905+ }
906+ $results .= $_data;
907+ } while(true);
908+
909+ if ($this->read_timeout > 0 && $this->_check_timeout($fp))
910+ {
911+ $this->status=-100;
912+ return false;
913+ }
914+
915+ // check if there is a a redirect meta tag
916+
917+ if(preg_match("'<meta[\s]*http-equiv[^>]*?content[\s]*=[\s]*[\"\']?\d+;[\s]*URL[\s]*=[\s]*([^\"\']*?)[\"\']?>'i",$results,$match))
918+
919+ {
920+ $this->_redirectaddr = $this->_expandlinks($match[1],$URI);
921+ }
922+
923+ // have we hit our frame depth and is there frame src to fetch?
924+ if(($this->_framedepth < $this->maxframes) && preg_match_all("'<frame\s+.*src[\s]*=[\'\"]?([^\'\"\>]+)'i",$results,$match))
925+ {
926+ $this->results[] = $results;
927+ for($x=0; $x<count($match[1]); $x++)
928+ $this->_frameurls[] = $this->_expandlinks($match[1][$x],$URI_PARTS["scheme"]."://".$this->host);
929+ }
930+ // have we already fetched framed content?
931+ elseif(is_array($this->results))
932+ $this->results[] = $results;
933+ // no framed content
934+ else
935+ $this->results = $results;
936+
937+ return true;
938+ }
939+
940+/*======================================================================*\
941+ Function: _httpsrequest
942+ Purpose: go get the https data from the server using curl
943+ Input: $url the url to fetch
944+ $URI the full URI
945+ $body body contents to send if any (POST)
946+ Output:
947+\*======================================================================*/
948+
949+ function _httpsrequest($url,$URI,$http_method,$content_type="",$body="")
950+ {
951+ if($this->passcookies && $this->_redirectaddr)
952+ $this->setcookies();
953+
954+ $headers = array();
955+
956+ $URI_PARTS = parse_url($URI);
957+ if(empty($url))
958+ $url = "/";
959+ // GET ... header not needed for curl
960+ //$headers[] = $http_method." ".$url." ".$this->_httpversion;
961+ if(!empty($this->agent))
962+ $headers[] = "User-Agent: ".$this->agent;
963+ if(!empty($this->host))
964+ /**
965+ * 80のときはポート番号を付けない
966+ * Marijuana
967+ */
968+ if(!empty($this->port) && $this->port != 80)
969+ $headers[] = "Host: ".$this->host.":".$this->port;
970+ else
971+ $headers[] = "Host: ".$this->host;
972+ if(!empty($this->accept))
973+ $headers[] = "Accept: ".$this->accept;
974+ if(!empty($this->referer))
975+ $headers[] = "Referer: ".$this->referer;
976+ if(!empty($this->cookies))
977+ {
978+ if(!is_array($this->cookies))
979+ $this->cookies = (array)$this->cookies;
980+
981+ reset($this->cookies);
982+ if ( count($this->cookies) > 0 ) {
983+ $cookie_str = 'Cookie: ';
984+ foreach ( $this->cookies as $cookieKey => $cookieVal ) {
985+ $cookie_str .= $cookieKey."=".urlencode($cookieVal)."; ";
986+ }
987+ $headers[] = substr($cookie_str,0,-2);
988+ }
989+ }
990+ if(!empty($this->rawheaders))
991+ {
992+ if(!is_array($this->rawheaders))
993+ $this->rawheaders = (array)$this->rawheaders;
994+ while(list($headerKey,$headerVal) = each($this->rawheaders))
995+ $headers[] = $headerKey.": ".$headerVal;
996+ }
997+ if(!empty($content_type)) {
998+ if ($content_type == "multipart/form-data")
999+ $headers[] = "Content-type: $content_type; boundary=".$this->_mime_boundary;
1000+ else
1001+ $headers[] = "Content-type: $content_type";
1002+ }
1003+ if(!empty($body))
1004+ $headers[] = "Content-length: ".strlen($body);
1005+ if(!empty($this->user) || !empty($this->pass))
1006+ $headers[] = "Authorization: BASIC ".base64_encode($this->user.":".$this->pass);
1007+
1008+ for($curr_header = 0; $curr_header < count($headers); $curr_header++) {
1009+ $safer_header = strtr( $headers[$curr_header], "\"", " " );
1010+ $cmdline_params .= " -H \"".$safer_header."\"";
1011+ }
1012+
1013+ if(!empty($body))
1014+ $cmdline_params .= " -d \"$body\"";
1015+
1016+ if($this->read_timeout > 0)
1017+ $cmdline_params .= " -m ".$this->read_timeout;
1018+
1019+ $headerfile = tempnam($temp_dir, "sno");
1020+
1021+ exec($this->curl_path." -k -D \"$headerfile\"".$cmdline_params." \"".escapeshellcmd($URI)."\"",$results,$return);
1022+
1023+ if($return)
1024+ {
1025+ $this->error = "Error: cURL could not retrieve the document, error $return.";
1026+ return false;
1027+ }
1028+
1029+
1030+ $results = implode("\r\n",$results);
1031+
1032+ $result_headers = file("$headerfile");
1033+
1034+ $this->_redirectaddr = false;
1035+ unset($this->headers);
1036+
1037+ for($currentHeader = 0; $currentHeader < count($result_headers); $currentHeader++)
1038+ {
1039+
1040+ // if a header begins with Location: or URI:, set the redirect
1041+ if(preg_match("/^(Location: |URI: )/i",$result_headers[$currentHeader]))
1042+ {
1043+ // get URL portion of the redirect
1044+ preg_match("/^(Location: |URI:)\s+(.*)/",chop($result_headers[$currentHeader]),$matches);
1045+ // look for :// in the Location header to see if hostname is included
1046+ if(!preg_match("|\:\/\/|",$matches[2]))
1047+ {
1048+ // no host in the path, so prepend
1049+ $this->_redirectaddr = $URI_PARTS["scheme"]."://".$this->host.":".$this->port;
1050+ // eliminate double slash
1051+ if(!preg_match("|^/|",$matches[2]))
1052+ $this->_redirectaddr .= "/".$matches[2];
1053+ else
1054+ $this->_redirectaddr .= $matches[2];
1055+ }
1056+ else
1057+ $this->_redirectaddr = $matches[2];
1058+ }
1059+
1060+ if(preg_match("|^HTTP/|",$result_headers[$currentHeader]))
1061+ $this->response_code = $result_headers[$currentHeader];
1062+
1063+ $this->headers[] = $result_headers[$currentHeader];
1064+ }
1065+
1066+ // check if there is a a redirect meta tag
1067+
1068+ if(preg_match("'<meta[\s]*http-equiv[^>]*?content[\s]*=[\s]*[\"\']?\d+;[\s]*URL[\s]*=[\s]*([^\"\']*?)[\"\']?>'i",$results,$match))
1069+ {
1070+ $this->_redirectaddr = $this->_expandlinks($match[1],$URI);
1071+ }
1072+
1073+ // have we hit our frame depth and is there frame src to fetch?
1074+ if(($this->_framedepth < $this->maxframes) && preg_match_all("'<frame\s+.*src[\s]*=[\'\"]?([^\'\"\>]+)'i",$results,$match))
1075+ {
1076+ $this->results[] = $results;
1077+ for($x=0; $x<count($match[1]); $x++)
1078+ $this->_frameurls[] = $this->_expandlinks($match[1][$x],$URI_PARTS["scheme"]."://".$this->host);
1079+ }
1080+ // have we already fetched framed content?
1081+ elseif(is_array($this->results))
1082+ $this->results[] = $results;
1083+ // no framed content
1084+ else
1085+ $this->results = $results;
1086+
1087+ unlink("$headerfile");
1088+
1089+ return true;
1090+ }
1091+
1092+/*======================================================================*\
1093+ Function: setcookies()
1094+ Purpose: set cookies for a redirection
1095+\*======================================================================*/
1096+
1097+ function setcookies()
1098+ {
1099+ for($x=0; $x<count($this->headers); $x++)
1100+ {
1101+ if(preg_match('/^set-cookie:[\s]+([^=]+)=([^;]+)/i', $this->headers[$x],$match))
1102+ $this->cookies[$match[1]] = urldecode($match[2]);
1103+ }
1104+ }
1105+
1106+
1107+/*======================================================================*\
1108+ Function: _check_timeout
1109+ Purpose: checks whether timeout has occurred
1110+ Input: $fp file pointer
1111+\*======================================================================*/
1112+
1113+ function _check_timeout($fp)
1114+ {
1115+ if ($this->read_timeout > 0) {
1116+ $fp_status = socket_get_status($fp);
1117+ if ($fp_status["timed_out"]) {
1118+ $this->timed_out = true;
1119+ return true;
1120+ }
1121+ }
1122+ return false;
1123+ }
1124+
1125+/*======================================================================*\
1126+ Function: _connect
1127+ Purpose: make a socket connection
1128+ Input: $fp file pointer
1129+\*======================================================================*/
1130+
1131+ function _connect(&$fp)
1132+ {
1133+ if(!empty($this->proxy_host) && !empty($this->proxy_port))
1134+ {
1135+ $this->_isproxy = true;
1136+
1137+ $host = $this->proxy_host;
1138+ $port = $this->proxy_port;
1139+ }
1140+ else
1141+ {
1142+ $host = $this->host;
1143+ $port = $this->port;
1144+ }
1145+
1146+ $this->status = 0;
1147+
1148+ if($fp = fsockopen(
1149+ $host,
1150+ $port,
1151+ $errno,
1152+ $errstr,
1153+ $this->_fp_timeout
1154+ ))
1155+ {
1156+ // socket connection succeeded
1157+
1158+ return true;
1159+ }
1160+ else
1161+ {
1162+ // socket connection failed
1163+ $this->status = $errno;
1164+ switch($errno)
1165+ {
1166+ case -3:
1167+ $this->error="socket creation failed (-3)";
1168+ case -4:
1169+ $this->error="dns lookup failure (-4)";
1170+ case -5:
1171+ $this->error="connection refused or timed out (-5)";
1172+ default:
1173+ $this->error="connection failed (".$errno.")";
1174+ }
1175+ return false;
1176+ }
1177+ }
1178+/*======================================================================*\
1179+ Function: _disconnect
1180+ Purpose: disconnect a socket connection
1181+ Input: $fp file pointer
1182+\*======================================================================*/
1183+
1184+ function _disconnect($fp)
1185+ {
1186+ return(fclose($fp));
1187+ }
1188+
1189+
1190+/*======================================================================*\
1191+ Function: _prepare_post_body
1192+ Purpose: Prepare post body according to encoding type
1193+ Input: $formvars - form variables
1194+ $formfiles - form upload files
1195+ Output: post body
1196+\*======================================================================*/
1197+
1198+ function _prepare_post_body($formvars, $formfiles)
1199+ {
1200+ settype($formvars, "array");
1201+ settype($formfiles, "array");
1202+ $postdata = '';
1203+
1204+ if (count($formvars) == 0 && count($formfiles) == 0)
1205+ return;
1206+
1207+ switch ($this->_submit_type) {
1208+ case "application/x-www-form-urlencoded":
1209+ reset($formvars);
1210+ while(list($key,$val) = each($formvars)) {
1211+ if (is_array($val) || is_object($val)) {
1212+ while (list($cur_key, $cur_val) = each($val)) {
1213+ $postdata .= urlencode($key)."[]=".urlencode($cur_val)."&";
1214+ }
1215+ } else
1216+ $postdata .= urlencode($key)."=".urlencode($val)."&";
1217+ }
1218+ break;
1219+
1220+ case "multipart/form-data":
1221+ $this->_mime_boundary = "Snoopy".md5(uniqid(microtime()));
1222+
1223+ reset($formvars);
1224+ while(list($key,$val) = each($formvars)) {
1225+ if (is_array($val) || is_object($val)) {
1226+ while (list($cur_key, $cur_val) = each($val)) {
1227+ $postdata .= "--".$this->_mime_boundary."\r\n";
1228+ $postdata .= "Content-Disposition: form-data; name=\"$key\[\]\"\r\n\r\n";
1229+ $postdata .= "$cur_val\r\n";
1230+ }
1231+ } else {
1232+ $postdata .= "--".$this->_mime_boundary."\r\n";
1233+ $postdata .= "Content-Disposition: form-data; name=\"$key\"\r\n\r\n";
1234+ $postdata .= "$val\r\n";
1235+ }
1236+ }
1237+
1238+ reset($formfiles);
1239+ while (list($field_name, $file_names) = each($formfiles)) {
1240+ settype($file_names, "array");
1241+ while (list(, $file_name) = each($file_names)) {
1242+ if (!is_readable($file_name)) continue;
1243+
1244+ $fp = fopen($file_name, "r");
1245+ $file_content = fread($fp, filesize($file_name));
1246+ fclose($fp);
1247+ $base_name = basename($file_name);
1248+
1249+ $postdata .= "--".$this->_mime_boundary."\r\n";
1250+ $postdata .= "Content-Disposition: form-data; name=\"$field_name\"; filename=\"$base_name\"\r\n\r\n";
1251+ $postdata .= "$file_content\r\n";
1252+ }
1253+ }
1254+ $postdata .= "--".$this->_mime_boundary."--\r\n";
1255+ break;
1256+ // XOOPS2 Hack begin
1257+ // Added on March 4, 2003 by onokazu@xoops.org
1258+ case "text/xml":
1259+ default:
1260+ $postdata = $formvars[0];
1261+ break;
1262+ // XOOPS2 Hack end
1263+ }
1264+
1265+ return $postdata;
1266+ }
1267+}
1268+
1269+?>