12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\BrowserKit;
- use Symfony\Component\BrowserKit\Exception\BadMethodCallException;
- use Symfony\Component\DomCrawler\Crawler;
- use Symfony\Component\DomCrawler\Form;
- use Symfony\Component\DomCrawler\Link;
- use Symfony\Component\Process\PhpProcess;
- /**
- * Simulates a browser.
- *
- * To make the actual request, you need to implement the doRequest() method.
- *
- * If you want to be able to run requests in their own process (insulated flag),
- * you need to also implement the getScript() method.
- *
- * @author Fabien Potencier <fabien@symfony.com>
- */
- abstract class AbstractBrowser
- {
// History of the requests made through request(); consulted for the referer and for resolving relative URIs.
- protected $history;
// Cookie jar whose values are sent with each request and which is updated from each response.
- protected $cookieJar;
// Default server parameters, merged under the per-call ones in request().
- protected $server = [];
// BrowserKit Request built by the last call to request().
- protected $internalRequest;
// Origin request: the result of filterRequest() on the internal request.
- protected $request;
// BrowserKit response: the result of filterResponse() on the origin response.
- protected $internalResponse;
// Origin response, as returned by doRequest() or doRequestInProcess().
- protected $response;
// Crawler created from the last response (stays null until request() has been called).
- protected $crawler;
// When true, request() goes through doRequestInProcess() instead of doRequest().
- protected $insulated = false;
// Redirect target of the last response (Location header or meta refresh URL); null when it was not a redirect.
- protected $redirect;
// Whether request() follows 3xx redirects automatically.
- protected $followRedirects = true;
// Whether request() follows <meta http-equiv="refresh"> redirects automatically.
- protected $followMetaRefresh = false;
// Maximum number of redirects; -1 disables the limit check in followRedirect().
- private $maxRedirects = -1;
// Number of redirect requests issued since the last main request.
- private $redirectCount = 0;
// Set of serialize()d history entries whose response was a redirect; back() and forward() skip them.
- private $redirects = [];
// False only while followRedirect() is issuing the follow-up request.
- private $isMainRequest = true;
/**
 * Initialises the browser with its default server parameters, history and cookie jar.
 *
 * @param array          $server    The server parameters (equivalent of $_SERVER)
 * @param History|null   $history   The history to record requests in; a new History is created when null
 * @param CookieJar|null $cookieJar The cookie jar to use; a new CookieJar is created when null
 */
public function __construct(array $server = [], ?History $history = null, ?CookieJar $cookieJar = null)
{
    $this->setServerParameters($server);
    // Nullable types are declared explicitly: relying on "= null" to make a type nullable is deprecated in PHP 8.4.
    $this->history = $history ?? new History();
    $this->cookieJar = $cookieJar ?? new CookieJar();
}
/**
 * Enables or disables the automatic following of HTTP redirect responses.
 *
 * @param bool $followRedirects True to let request() follow redirects on its own
 */
public function followRedirects(bool $followRedirects = true)
{
    $this->followRedirects = $followRedirects;
}
/**
 * Enables or disables the automatic following of meta refresh redirects.
 *
 * @param bool $followMetaRefresh True to let request() follow <meta http-equiv="refresh"> redirects
 */
public function followMetaRefresh(bool $followMetaRefresh = true)
{
    $this->followMetaRefresh = $followMetaRefresh;
}
/**
 * Tells whether redirect responses are followed automatically.
 *
 * @return bool The current value of the follow-redirects flag
 */
public function isFollowingRedirects()
{
    return $this->followRedirects;
}
/**
 * Defines how many redirects may be followed for one main request.
 *
 * Any negative value is stored as -1. As a side effect the follow-redirects
 * flag is updated as well: it is switched off when the stored value is -1
 * and switched on for every other value.
 *
 * @param int $maxRedirects The maximum number of redirects
 */
public function setMaxRedirects(int $maxRedirects)
{
    if ($maxRedirects < 0) {
        $maxRedirects = -1;
    }

    $this->maxRedirects = $maxRedirects;
    $this->followRedirects = -1 !== $maxRedirects;
}
/**
 * Gives the configured redirect limit.
 *
 * @return int The maximum number of redirects (-1 when no limit is enforced)
 */
public function getMaxRedirects()
{
    return $this->maxRedirects;
}
/**
 * Switches request insulation on or off.
 *
 * When insulation is on, request() performs requests through doRequestInProcess().
 *
 * @param bool $insulated Whether to insulate the requests or not
 *
 * @throws \LogicException When insulation is requested but the Symfony Process Component is not installed
 */
public function insulate(bool $insulated = true)
{
    if ($insulated) {
        // Only probe for the Process component when insulation is actually being enabled.
        if (!class_exists(\Symfony\Component\Process\Process::class)) {
            throw new \LogicException('Unable to isolate requests as the Symfony Process Component is not installed.');
        }
    }

    $this->insulated = $insulated;
}
/**
 * Replaces all default server parameters.
 *
 * A default HTTP_USER_AGENT is provided; a value given in $server overrides it.
 *
 * @param array $server An array of server parameters
 */
public function setServerParameters(array $server)
{
    $defaults = ['HTTP_USER_AGENT' => 'Symfony BrowserKit'];

    $this->server = array_merge($defaults, $server);
}
/**
 * Sets (or overwrites) one default server parameter.
 *
 * @param string $key   The parameter name
 * @param string $value The parameter value
 */
public function setServerParameter(string $key, string $value)
{
    $this->server[$key] = $value;
}
/**
 * Reads one default server parameter.
 *
 * @param string $key     The parameter name
 * @param mixed  $default The value returned when the parameter is undefined or null
 *
 * @return mixed The parameter value, or $default
 */
public function getServerParameter(string $key, $default = '')
{
    return $this->server[$key] ?? $default;
}
/**
 * Calls a URI the way an XMLHttpRequest would.
 *
 * The HTTP_X_REQUESTED_WITH server parameter is set to "XMLHttpRequest" for
 * the duration of the call and removed afterwards, even when the request throws.
 * The arguments are passed through unchanged to request().
 *
 * @param string      $method        The request method
 * @param string      $uri           The URI to fetch
 * @param array       $parameters    The Request parameters
 * @param array       $files         The files
 * @param array       $server        The server parameters (HTTP headers are referenced with an HTTP_ prefix as PHP does)
 * @param string|null $content       The raw body data
 * @param bool        $changeHistory Whether to update the history or not
 */
public function xmlHttpRequest(string $method, string $uri, array $parameters = [], array $files = [], array $server = [], ?string $content = null, bool $changeHistory = true): Crawler
{
    $this->setServerParameter('HTTP_X_REQUESTED_WITH', 'XMLHttpRequest');

    try {
        return $this->request($method, $uri, $parameters, $files, $server, $content, $changeHistory);
    } finally {
        // Always drop the marker header so later regular requests are not flagged as XHR.
        unset($this->server['HTTP_X_REQUESTED_WITH']);
    }
}
/**
 * Gives access to the request history.
 *
 * @return History The History instance used by this browser
 */
public function getHistory()
{
    return $this->history;
}
/**
 * Gives access to the cookie jar.
 *
 * @return CookieJar The CookieJar instance used by this browser
 */
public function getCookieJar()
{
    return $this->cookieJar;
}
/**
 * Gives the Crawler built from the last response.
 *
 * @return Crawler A Crawler instance
 *
 * @throws BadMethodCallException When no crawler is available yet
 */
public function getCrawler()
{
    if (null !== $this->crawler) {
        return $this->crawler;
    }

    throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
}
/**
 * Gives the BrowserKit Response of the last request.
 *
 * This is the value produced by filterResponse().
 *
 * @return Response A BrowserKit Response instance
 *
 * @throws BadMethodCallException When no response is available yet
 */
public function getInternalResponse()
{
    if (null !== $this->internalResponse) {
        return $this->internalResponse;
    }

    throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
}
/**
 * Gives the origin response of the last request.
 *
 * The origin response is the object handed back by the code that
 * handles requests, before it is filtered into a BrowserKit Response.
 *
 * @return object A response instance
 *
 * @throws BadMethodCallException When no response is available yet
 *
 * @see doRequest()
 */
public function getResponse()
{
    if (null !== $this->response) {
        return $this->response;
    }

    throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
}
/**
 * Gives the BrowserKit Request built by the last call to request().
 *
 * @return Request A BrowserKit Request instance
 *
 * @throws BadMethodCallException When no request has been made yet
 */
public function getInternalRequest()
{
    if (null !== $this->internalRequest) {
        return $this->internalRequest;
    }

    throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
}
/**
 * Gives the origin request of the last call to request().
 *
 * The origin request is the object produced by filterRequest() and
 * passed to the code that handles requests.
 *
 * @return object A Request instance
 *
 * @throws BadMethodCallException When no request has been made yet
 *
 * @see doRequest()
 */
public function getRequest()
{
    if (null !== $this->request) {
        return $this->request;
    }

    throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
}
/**
 * Follows a link; a Form instance is submitted instead.
 *
 * @param Link $link The link (or form) to activate
 *
 * @return Crawler
 */
public function click(Link $link)
{
    if (!$link instanceof Form) {
        return $this->request($link->getMethod(), $link->getUri());
    }

    return $this->submit($link);
}
/**
 * Clicks the first link (or clickable image) of the current page that contains the given text.
 *
 * @param string $linkText The text of the link or the alt attribute of the clickable image
 *
 * @throws BadMethodCallException When no page has been requested yet
 */
public function clickLink(string $linkText): Crawler
{
    if (null === $this->crawler) {
        throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
    }

    $link = $this->crawler->selectLink($linkText)->link();

    return $this->click($link);
}
/**
 * Submits a form after applying the given field values to it.
 *
 * @param Form  $form             The form to submit
 * @param array $values           An array of form field values
 * @param array $serverParameters An array of server parameters
 *
 * @return Crawler
 */
public function submit(Form $form, array $values = [], array $serverParameters = [])
{
    $form->setValues($values);

    $method = $form->getMethod();
    $uri = $form->getUri();
    $parameters = $form->getPhpValues();
    $files = $form->getPhpFiles();

    return $this->request($method, $uri, $parameters, $files, $serverParameters);
}
/**
 * Locates the first form of the current page owning a button with the given
 * content, fills it with the given field values and submits it.
 *
 * @param string $button           The text content, id, value or name of the form <button> or <input type="submit">
 * @param array  $fieldValues      Use this syntax: ['my_form[name]' => '...', 'my_form[email]' => '...']
 * @param string $method           The HTTP method used to submit the form
 * @param array  $serverParameters These values override the ones stored in $_SERVER (HTTP headers must include an HTTP_ prefix as PHP does)
 *
 * @throws BadMethodCallException When no page has been requested yet
 */
public function submitForm(string $button, array $fieldValues = [], string $method = 'POST', array $serverParameters = []): Crawler
{
    if (null === $this->crawler) {
        throw new BadMethodCallException(sprintf('The "request()" method must be called before "%s()".', __METHOD__));
    }

    $form = $this->crawler->selectButton($button)->form($fieldValues, $method);

    return $this->submit($form, [], $serverParameters);
}
/**
 * Calls a URI.
 *
 * Builds the BrowserKit request, performs it (in-process or insulated),
 * updates the cookie jar, and follows HTTP or meta refresh redirects when
 * the corresponding flags are enabled.
 *
 * @param string      $method        The request method
 * @param string      $uri           The URI to fetch
 * @param array       $parameters    The Request parameters
 * @param array       $files         The files
 * @param array       $server        The server parameters (HTTP headers are referenced with an HTTP_ prefix as PHP does)
 * @param string|null $content       The raw body data
 * @param bool        $changeHistory Whether to update the history or not (only used internally for back(), forward(), and reload())
 *
 * @return Crawler
 */
public function request(string $method, string $uri, array $parameters = [], array $files = [], array $server = [], ?string $content = null, bool $changeHistory = true)
{
    // A main request restarts the redirect counter; a request issued by followRedirect() increments it.
    if ($this->isMainRequest) {
        $this->redirectCount = 0;
    } else {
        ++$this->redirectCount;
    }

    $originalUri = $uri;

    $uri = $this->getAbsoluteUri($uri);

    // Per-call server parameters take precedence over the browser defaults.
    $server = array_merge($this->server, $server);

    // The caller gave no host in the URI: an explicit HTTP_HOST parameter replaces the resolved host.
    if (!empty($server['HTTP_HOST']) && null === parse_url($originalUri, \PHP_URL_HOST)) {
        $uri = preg_replace('{^(https?\://)'.preg_quote($this->extractHost($uri)).'}', '${1}'.$server['HTTP_HOST'], $uri);
    }

    // The caller gave no scheme in the URI: the HTTPS parameter decides between http and https.
    if (isset($server['HTTPS']) && null === parse_url($originalUri, \PHP_URL_SCHEME)) {
        $uri = preg_replace('{^'.parse_url($uri, \PHP_URL_SCHEME).'}', $server['HTTPS'] ? 'https' : 'http', $uri);
    }

    // Default the referer to the page currently at the top of the history.
    if (!isset($server['HTTP_REFERER']) && !$this->history->isEmpty()) {
        $server['HTTP_REFERER'] = $this->history->current()->getUri();
    }

    if (empty($server['HTTP_HOST'])) {
        $server['HTTP_HOST'] = $this->extractHost($uri);
    }

    // From here on HTTPS always reflects the scheme of the final URI.
    $server['HTTPS'] = 'https' == parse_url($uri, \PHP_URL_SCHEME);

    $this->internalRequest = new Request($uri, $method, $parameters, $files, $this->cookieJar->allValues($uri), $server, $content);

    $this->request = $this->filterRequest($this->internalRequest);

    if (true === $changeHistory) {
        $this->history->add($this->internalRequest);
    }

    if ($this->insulated) {
        $this->response = $this->doRequestInProcess($this->request);
    } else {
        $this->response = $this->doRequest($this->request);
    }

    $this->internalResponse = $this->filterResponse($this->response);

    $this->cookieJar->updateFromResponse($this->internalResponse, $uri);

    $status = $this->internalResponse->getStatusCode();

    // Only 3xx responses carry a redirect target.
    if ($status >= 300 && $status < 400) {
        $this->redirect = $this->internalResponse->getHeader('Location');
    } else {
        $this->redirect = null;
    }

    if ($this->followRedirects && $this->redirect) {
        // Remember this history entry as a redirect so back() and forward() can skip it.
        $this->redirects[serialize($this->history->current())] = true;

        return $this->crawler = $this->followRedirect();
    }

    $this->crawler = $this->createCrawlerFromContent($this->internalRequest->getUri(), $this->internalResponse->getContent(), $this->internalResponse->getHeader('Content-Type') ?? '');

    // Check for meta refresh redirect
    if ($this->followMetaRefresh && null !== $redirect = $this->getMetaRefreshUrl()) {
        $this->redirect = $redirect;
        $this->redirects[serialize($this->history->current())] = true;
        $this->crawler = $this->followRedirect();
    }

    return $this->crawler;
}
/**
 * Performs a request in a separate PHP process.
 *
 * The script returned by getScript() is run through PhpProcess; its output
 * is expected to be a serialized object, which is unserialized and returned.
 * Deprecations written by the child process to the file named by the
 * SYMFONY_DEPRECATIONS_SERIALIZE environment variable are re-triggered here.
 *
 * @param object $request An origin request instance
 *
 * @return object An origin response instance
 *
 * @throws \RuntimeException When the process fails or its output does not start like a serialized object
 */
protected function doRequestInProcess($request)
{
    $deprecationLog = tempnam(sys_get_temp_dir(), 'deprec');
    putenv('SYMFONY_DEPRECATIONS_SERIALIZE='.$deprecationLog);
    $_ENV['SYMFONY_DEPRECATIONS_SERIALIZE'] = $deprecationLog;

    $script = $this->getScript($request);
    $process = new PhpProcess($script, null, null);
    $process->run();

    if (file_exists($deprecationLog)) {
        $serialized = file_get_contents($deprecationLog);
        unlink($deprecationLog);

        $entries = $serialized ? unserialize($serialized) : [];
        foreach ($entries as $entry) {
            if (!$entry[0]) {
                @trigger_error($entry[1], \E_USER_DEPRECATED);

                continue;
            }

            // unsilenced on purpose
            trigger_error($entry[1], \E_USER_DEPRECATED);
        }
    }

    $succeeded = $process->isSuccessful();
    $output = $process->getOutput();

    if ($succeeded && preg_match('/^O\:\d+\:/', $output)) {
        return unserialize($output);
    }

    throw new \RuntimeException(sprintf('OUTPUT: %s ERROR OUTPUT: %s.', $output, $process->getErrorOutput()));
}
/**
 * Performs the actual request.
 *
 * Concrete browsers implement this method; request() calls it with the
 * origin request whenever the browser is not insulated.
 *
 * @param object $request An origin request instance
 *
 * @return object An origin response instance
 */
abstract protected function doRequest($request);
/**
 * Builds the PHP script run by doRequestInProcess() for an insulated request.
 *
 * This default implementation always throws; browsers that support
 * insulation must override it.
 *
 * @param object $request An origin request instance
 *
 * @throws \LogicException When the method has not been overridden
 */
protected function getScript($request)
{
    throw new \LogicException('To insulate requests, you need to override the getScript() method.');
}
/**
 * Converts the BrowserKit request into the origin request.
 *
 * The default implementation hands the BrowserKit request back unchanged.
 *
 * @param Request $request The BrowserKit request
 *
 * @return object An origin request instance
 */
protected function filterRequest(Request $request)
{
    return $request;
}
/**
 * Converts the origin response into the BrowserKit one.
 *
 * The default implementation hands the origin response back unchanged.
 *
 * @param object $response The origin response to filter
 *
 * @return Response A BrowserKit Response instance
 */
protected function filterResponse($response)
{
    return $response;
}
/**
 * Builds a crawler for the given content.
 *
 * Null is returned when the DomCrawler component is not available.
 *
 * @param string $uri     The URI the content was fetched from
 * @param string $content The response body
 * @param string $type    The content type passed along with the content
 *
 * @return Crawler|null
 */
protected function createCrawlerFromContent(string $uri, string $content, string $type)
{
    if (class_exists(Crawler::class)) {
        $crawler = new Crawler(null, $uri);
        $crawler->addContent($content, $type);

        return $crawler;
    }

    return null;
}
/**
 * Goes back in the browser history.
 *
 * History entries recorded as redirects are skipped; the entry reached is
 * requested again without changing the history.
 *
 * @return Crawler
 */
public function back()
{
    $request = $this->history->back();
    while (\array_key_exists(serialize($request), $this->redirects)) {
        $request = $this->history->back();
    }

    return $this->requestFromRequest($request, false);
}
/**
 * Goes forward in the browser history.
 *
 * History entries recorded as redirects are skipped; the entry reached is
 * requested again without changing the history.
 *
 * @return Crawler
 */
public function forward()
{
    $request = $this->history->forward();
    while (\array_key_exists(serialize($request), $this->redirects)) {
        $request = $this->history->forward();
    }

    return $this->requestFromRequest($request, false);
}
/**
 * Repeats the current history entry without changing the history.
 *
 * @return Crawler
 */
public function reload()
{
    $current = $this->history->current();

    return $this->requestFromRequest($current, false);
}
/**
 * Follows the redirect of the last response.
 *
 * For 301, 302 and 303 responses the follow-up request is a GET without
 * files or body; for any other status the original method, files and body
 * are reused. Request parameters are only forwarded for non-GET requests.
 *
 * @return Crawler
 *
 * @throws \LogicException If request was not a redirect, or if the maximum number of redirects was reached
 */
public function followRedirect()
{
    if (empty($this->redirect)) {
        throw new \LogicException('The request was not redirected.');
    }

    if (-1 !== $this->maxRedirects) {
        if ($this->redirectCount > $this->maxRedirects) {
            $this->redirectCount = 0;
            throw new \LogicException(sprintf('The maximum number (%d) of redirections was reached.', $this->maxRedirects));
        }
    }

    $request = $this->internalRequest;

    if (\in_array($this->internalResponse->getStatusCode(), [301, 302, 303])) {
        $method = 'GET';
        $files = [];
        $content = null;
    } else {
        $method = $request->getMethod();
        $files = $request->getFiles();
        $content = $request->getContent();
    }

    if ('GET' === strtoupper($method)) {
        // Don't forward parameters for GET request as it should reach the redirection URI
        $parameters = [];
    } else {
        $parameters = $request->getParameters();
    }

    $server = $request->getServer();
    $server = $this->updateServerFromUri($server, $this->redirect);

    $this->isMainRequest = false;

    try {
        return $this->request($method, $this->redirect, $parameters, $files, $server, $content);
    } finally {
        // Restore the flag even when the follow-up request throws, otherwise
        // the next top-level request() would be counted as a redirect.
        $this->isMainRequest = true;
    }
}
/**
 * Extracts the target of an immediate (0 second) meta refresh from the current page.
 *
 * Only <meta http-equiv="refresh"> elements located in <head> are considered;
 * the first one whose content matches "0; URL=..." wins. Tab, carriage
 * return and line feed characters are removed from the extracted URL.
 *
 * @return string|null The refresh URL, or null when the page has no immediate meta refresh
 *
 * @see https://dev.w3.org/html5/spec-preview/the-meta-element.html#attr-meta-http-equiv-refresh
 */
private function getMetaRefreshUrl(): ?string
{
    $metaRefresh = $this->getCrawler()->filter('head meta[http-equiv="refresh"]');
    foreach ($metaRefresh->extract(['content']) as $content) {
        if (preg_match('/^\s*0\s*;\s*URL\s*=\s*(?|\'([^\']++)|"([^"]++)|([^\'"].*))/i', $content, $m)) {
            // Strip each character individually: a single "\t\r\n" search string
            // would only match that exact three-character sequence.
            return str_replace(["\t", "\r", "\n"], '', rtrim($m[1]));
        }
    }

    return null;
}
/**
 * Restarts the client.
 *
 * Every cookie is dropped from the cookie jar and the history is emptied.
 */
public function restart()
{
    $this->cookieJar->clear();
    $this->history->clear();
}
/**
 * Takes a URI and converts it to absolute if it is not already absolute.
 *
 * Relative URIs are resolved against the current history entry or, when the
 * history is empty, against a base built from the HTTPS and HTTP_HOST
 * server parameters (host defaults to "localhost").
 *
 * @param string $uri A URI
 *
 * @return string An absolute URI
 */
protected function getAbsoluteUri(string $uri)
{
    // already absolute?
    if (0 === strpos($uri, 'http://') || 0 === strpos($uri, 'https://')) {
        return $uri;
    }

    if (!$this->history->isEmpty()) {
        $currentUri = $this->history->current()->getUri();
    } else {
        // Test the value rather than mere presence, as request() does: HTTPS => false means plain http.
        $currentUri = sprintf('http%s://%s/',
            !empty($this->server['HTTPS']) ? 's' : '',
            $this->server['HTTP_HOST'] ?? 'localhost'
        );
    }

    // protocol relative URL
    if (0 === strpos($uri, '//')) {
        return parse_url($currentUri, \PHP_URL_SCHEME).':'.$uri;
    }

    // anchor or query string parameters?
    // Compare against '' explicitly: the relative path "0" is falsy but is not an empty URI.
    if ('' === $uri || '#' === $uri[0] || '?' === $uri[0]) {
        return preg_replace('/[#?].*?$/', '', $currentUri).$uri;
    }

    if ('/' !== $uri[0]) {
        $path = (string) parse_url($currentUri, \PHP_URL_PATH);

        if ('' === $path) {
            // A base such as "http://example.com" has no path; resolve against the root
            // so the result is "http://example.com/foo" and not "http://example.comfoo".
            $path = '/';
        } elseif ('/' !== substr($path, -1)) {
            // Drop the last path segment of the base, keeping its directory part.
            $path = substr($path, 0, strrpos($path, '/') + 1);
        }

        $uri = $path.$uri;
    }

    // Prefix the (now root-relative) URI with the scheme and authority of the base.
    return preg_replace('#^(.*?//[^/]+)\/.*$#', '$1', $currentUri).$uri;
}
/**
 * Replays a BrowserKit Request object through request().
 *
 * @param Request $request       The request whose method, URI, parameters, files, server parameters and content are reused
 * @param bool    $changeHistory Whether to update the history or not (only used internally for back(), forward(), and reload())
 *
 * @return Crawler
 */
protected function requestFromRequest(Request $request, $changeHistory = true)
{
    $method = $request->getMethod();
    $uri = $request->getUri();
    $parameters = $request->getParameters();
    $files = $request->getFiles();
    $server = $request->getServer();
    $content = $request->getContent();

    return $this->request($method, $uri, $parameters, $files, $server, $content, $changeHistory);
}
/**
 * Adapts server parameters to the given URI.
 *
 * HTTP_HOST is taken from the URI, HTTPS follows the URI scheme (and is
 * kept as-is when the URI has none), and the conditional request headers
 * HTTP_IF_NONE_MATCH and HTTP_IF_MODIFIED_SINCE are removed.
 *
 * @param array  $server The server parameters to adapt
 * @param string $uri    The URI the parameters are adapted to
 *
 * @return array The adapted server parameters
 */
private function updateServerFromUri(array $server, string $uri): array
{
    $server['HTTP_HOST'] = $this->extractHost($uri);

    $scheme = parse_url($uri, \PHP_URL_SCHEME);
    if (null !== $scheme) {
        $https = 'https' == $scheme;
    } else {
        // No scheme in the URI: keep the value already present.
        $https = $server['HTTPS'];
    }
    $server['HTTPS'] = $https;

    unset($server['HTTP_IF_NONE_MATCH']);
    unset($server['HTTP_IF_MODIFIED_SINCE']);

    return $server;
}
/**
 * Extracts the host of a URI, followed by ":port" when the URI has a port.
 *
 * @param string $uri The URI to inspect
 *
 * @return string|null The host (with optional port), or null when the URI has no host
 */
private function extractHost(string $uri): ?string
{
    $host = parse_url($uri, \PHP_URL_HOST);
    $port = parse_url($uri, \PHP_URL_PORT);

    return $port ? $host.':'.$port : $host;
}
- }
|