0

我需要获取带有已执行 js 的 html,为此我安装了 phantomjs,但在获取内容时,我仍然有旧的 html,带有旧数据,数据应该由 js 脚本处理,并且应该更改为带有某个类的 span 标签,该脚本应该执行。我正确理解,当我打开获取内容时,我应该获取带有处理数据的 DOM,这意味着标签跨度而不是 json 元素?我mssed什么?

public function getContentByPhantomjs($url)
{
    $client = Client::getInstance();

    $client->getEngine()->addOption('--ssl-protocol=any');
    $client->getEngine()->addOption('--ignore-ssl-errors=true');
    $client->getEngine()->addOption('--web-security=false');

    $client->getEngine()->setPath(MY_PATH . 'bin/phantomjs');

    $request = $client->getMessageFactory()->createRequest($url, 'GET');
    $response = $client->getMessageFactory()->createResponse();

    // Send the request
    $client->send($request, $response);

    return $response->getStatus() === 200 ? $response->getContent() : false;

}

但是js没有执行,我没有处理#pretty_json_id中的数据

    <div class="headline">

        <div id="pretty_json_id">
        <pre>                
          {"Company":"test"}
        </pre>
    </div>


<script>


    function ready() {
        element = document.getElementById('pretty_json_id').getElementsByTagName('pre');

        if (element.length > 0) {
            let parseJson = JSON.parse(element[0].innerHTML);
            let stringifyJson = JSON.stringify(parseJson, undefined, 4);
            element[0].innerHTML = syntaxHighlight(stringifyJson);
        }
    }

    function syntaxHighlight(json) {
        json = json.replace(/&/g, '&amp;').replace(/</g, '&lt;').replace(/>/g, '&gt;');
        return json.replace(/("(\\u[a-zA-Z0-9]{4}|\\[^u]|[^\\"])*"(\s*:)?|\b(true|false|null)\b|-?\d+(?:\.\d*)?(?:[eE][+\-]?\d+)?)/g, function (match) {
            var cls = 'number';
            if (/^"/.test(match)) {
                if (/:$/.test(match)) {
                    cls = 'key';
                } else {
                    cls = 'string';
                }
            } else if (/true|false/.test(match)) {
                cls = 'boolean';
            } else if (/null/.test(match)) {
                cls = 'null';
            }
            return '<span class="' + cls + '">' + match + '</span>';
        });
    }

    document.addEventListener("DOMContentLoaded", ready);
</script>

在浏览器中,everythink 工作。但我需要存在执行 js 的 html

日志信息

    2020-01-28T14:49:34 [DEBUG] CookieJar - Created but will not store cookies (use option '--cookies-file=<filename>' to enable persistent cookie storage)
2020-01-28T14:49:34 [DEBUG] Set  "http"  proxy to:  "" : 1080
2020-01-28T14:49:34 [DEBUG] Phantom - execute: Configuration
2020-01-28T14:49:34 [DEBUG]      0 objectName : ""
2020-01-28T14:49:34 [DEBUG]      1 cookiesFile : ""
2020-01-28T14:49:34 [DEBUG]      2 diskCacheEnabled : "true"
2020-01-28T14:49:34 [DEBUG]      3 maxDiskCacheSize : "-1"
2020-01-28T14:49:34 [DEBUG]      4 diskCachePath : ""
2020-01-28T14:49:34 [DEBUG]      5 ignoreSslErrors : "true"
2020-01-28T14:49:34 [DEBUG]      6 localUrlAccessEnabled : "true"
2020-01-28T14:49:34 [DEBUG]      7 localToRemoteUrlAccessEnabled : "false"
2020-01-28T14:49:34 [DEBUG]      8 outputEncoding : "UTF-8"
2020-01-28T14:49:34 [DEBUG]      9 proxyType : "http"
2020-01-28T14:49:34 [DEBUG]      10 proxy : ":1080"
2020-01-28T14:49:34 [DEBUG]      11 proxyAuth : ":"
2020-01-28T14:49:34 [DEBUG]      12 scriptEncoding : "UTF-8"
2020-01-28T14:49:34 [DEBUG]      13 webSecurityEnabled : "false"
2020-01-28T14:49:34 [DEBUG]      14 offlineStoragePath : ""
2020-01-28T14:49:34 [DEBUG]      15 localStoragePath : ""
2020-01-28T14:49:34 [DEBUG]      16 localStorageDefaultQuota : "-1"
2020-01-28T14:49:34 [DEBUG]      17 offlineStorageDefaultQuota : "-1"
2020-01-28T14:49:34 [DEBUG]      18 printDebugMessages : "true"
2020-01-28T14:49:34 [DEBUG]      19 javascriptCanOpenWindows : "true"
2020-01-28T14:49:34 [DEBUG]      20 javascriptCanCloseWindows : "true"
2020-01-28T14:49:34 [DEBUG]      21 sslProtocol : "any"
2020-01-28T14:49:34 [DEBUG]      22 sslCiphers : "ECDHE-ECDSA-AES128-GCM-SHA256:ECDHE-RSA-AES128-GCM-SHA256:DHE-RSA-AES128-GCM-SHA256:ECDHE-ECDSA-AES256-SHA:ECDHE-ECDSA-AES128-SHA:ECDHE-RSA-AES128-SHA:ECDHE-RSA-AES256-SHA:ECDHE-ECDSA-RC4-SHA:ECDHE-RSA-RC4-SHA:DHE-RSA-AES128-SHA:DHE-DSS-AES128-SHA:DHE-RSA-AES256-SHA:AES128-GCM-SHA256:AES128-SHA:AES256-SHA:DES-CBC3-SHA:RC4-SHA:RC4-MD5"
2020-01-28T14:49:34 [DEBUG]      23 sslCertificatesPath : ""
2020-01-28T14:49:34 [DEBUG]      24 sslClientCertificateFile : ""
2020-01-28T14:49:34 [DEBUG]      25 sslClientKeyFile : ""
2020-01-28T14:49:34 [DEBUG]      26 sslClientKeyPassphrase : ""
2020-01-28T14:49:34 [DEBUG]      27 webdriver : ":"
2020-01-28T14:49:34 [DEBUG]      28 webdriverLogFile : ""
2020-01-28T14:49:34 [DEBUG]      29 webdriverLogLevel : "INFO"
2020-01-28T14:49:34 [DEBUG]      30 webdriverSeleniumGridHub : ""
2020-01-28T14:49:34 [DEBUG] Phantom - execute: Script & Arguments
2020-01-28T14:49:34 [DEBUG]      script: "/tmp/1140ef46a6d6bfd239db"
2020-01-28T14:49:34 [DEBUG] Phantom - execute: Starting normal mode
2020-01-28T14:49:34 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:34 [DEBUG] FileSystem - _open: ":/modules/fs.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:34 [DEBUG] FileSystem - _open: ":/modules/system.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:34 [DEBUG] FileSystem - _open: ":/modules/webpage.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:34 [DEBUG] WebPage - updateLoadingProgress: 10
2020-01-28T14:49:35 [DEBUG] CookieJar - Saved "PHPSESSID=rh333emlg3vfov3u66e4lbkdkc; domain=cdb.preem.local; path=/"
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 30
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 34
2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [WARNING] QNetworkDiskCache::prepare() unable to open temporary file
2020-01-28T14:49:35 [WARNING] QNetworkDiskCache::prepare() unable to open temporary file
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 37
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 40
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 43
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 100
2020-01-28T14:49:35 [DEBUG] WebPage - evaluateJavaScript "(function() { return (function () {\n    \n    var styles = {};\n    \n    for(var property in styles) {\n        document.body.style[property] = styles[property];\n    }\n})(); })()"
2020-01-28T14:49:35 [DEBUG] WebPage - evaluateJavaScript result QVariant(Invalid)
2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [DEBUG] WebPage - evaluateJavaScript "(function() { return (function () {\n            return document.getElementsByTagName('html')[0].innerHTML;\n        })(); })()"
2020-01-28T14:49:35 [DEBUG] WebPage - evaluateJavaScript result QVariant(QString, "my html")
2020-01-28T13:49:34 [INFO] PhantomJS - Set viewport size ~ width: 1366 height: 768\n2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 10
2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 100
2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/fs.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/system.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/webpage.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 10
2020-01-28T14:49:35 [DEBUG] WebPage - setupFrame ""
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/fs.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/system.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] FileSystem - _open: ":/modules/webpage.js" QMap(("mode", QVariant(QString, "r")))
2020-01-28T14:49:35 [DEBUG] WebPage - updateLoadingProgress: 100
2020-01-28T14:49:35 [DEBUG] CookieJar - Purged (session) "PHPSESSID=rh333emlg3vfov3u66e4lbkdkc; domain=my.local; path=/"
4

1 回答 1

0

问题出在let变量上,在我将其替换为var一切正常后

于 2020-01-28T15:03:13.173 回答