|
- <mxGraphModel>
- <root>
<!-- Root cell (id="0"). Its "data" JsonProperty holds the flow-level settings:
     spiderName (still the placeholder "未定义名称", i.e. "undefined name"),
     submit-strategy "random" and threadCount "1". -->
- <mxCell id="0">
- <JsonProperty as="data">
- {"spiderName":"未定义名称","submit-strategy":"random","threadCount":"1"}
- </JsonProperty>
- </mxCell>
<!-- Cell id="1", child of root cell "0". Every vertex and edge in this model declares parent="1". -->
- <mxCell id="1" parent="0"/>
<!-- Start vertex (style and shape "start"), labelled 开始 ("Start").
     Edge 393 connects it to variable cell 392. -->
- <mxCell id="2" value="开始" style="start" parent="1" vertex="1">
- <mxGeometry x="90" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"shape":"start"}
- </JsonProperty>
- </mxCell>
<!-- Request vertex, labelled 开始抓取1 ("start crawl 1"). Reached from variable cell 392
     via edge 394; edge 371 leads on to variable cell 369.
     method GET, response-charset utf-8. The url expression builds a Baidu search for
     "site:xiaohongshu.com <keyword>" and sets pn to startIndex followed by a literal "0"
     (keyword and startIndex are defined in cell 392).
     Sends one "Cookie" header and one "User-Agent" header; follow-redirect, tls-validate
     and cookie-auto-set are "1", repeat-enable is "0".
     The JSON object below is kept on ONE line: it was previously broken in the middle of the
     cookie-value string, and a raw line break is not allowed inside a JSON string
     (nor inside a Cookie header value).
     NOTE(review): cookie-value hard-codes what look like personal browser session cookies
     (BDUSS, BAIDUID, ...); consider supplying them from outside this file. TODO confirm.
     NOTE(review): the url contains bare ampersands; if this file is fed to an XML parser they
     must be written as &amp; in text content. Confirm how the file is consumed before changing. -->
- <mxCell id="5" value="开始抓取1" style="request" parent="1" vertex="1">
- <mxGeometry x="380" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"开始抓取1","loopVariableName":"","method":"GET","sleep":"","timeout":"","response-charset":"utf-8","retryCount":"","retryInterval":"","cookie-name":["Cookie"],"cookie-description":[""],"header-name":["User-Agent"],"header-description":[""],"body-type":"none","body-content-type":"text/plain","loopCount":"","url":"${'https://www.baidu.com/s?wd=site%3Axiaohongshu.com%20'+keyword+'&pn='+startIndex+'0&oq=site%3Axiaohongshu.com%20'+keyword+'&ie=utf-8&rsv_pq=e2f0a475000042c5&rsv_t=9ea9dVLpUJnYTMsMoLr%2FJEKf5u9kVwWw0ClcmcocojFr%2FDLXSOQyIydSLKU'}","proxy":"","cookie-value":["BIDUPSID=FFCCEFFD6AD71B7D82B27246697129D3; PSTM=1661740480; BAIDUID=6504A43EB0274812F809031B8671878C:FG=1; BD_UPN=12314753; BDUSS=NneHRaYzJNVnVCQ1lOa2RLNkozYlBNQkJMeHVqMzFOZm96SH5mQWlKajZia2RqSVFBQUFBJCQAAAAAAAAAAAEAAAB~B2D2tcjIscqntcSwrgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAPrhH2P64R9jb0; BDUSS_BFESS=NneHRaYzJNVnVCQ1lOa2RLNkozYlBNQkJMeHVqMzFOZm96SH5mQWlKajZia2RqSVFBQUFBJCQAAAAAAAAAAAEAAAB~B2D2tcjIscqntcSwrgAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAPrhH2P64R9jb0; H_WISE_SIDS=110085_209568_211986_212870_215730_216941_219942_219946_221410_221796_222298_222396_223064_223683_224055_224065_224086_225202_225640_225854_226026_226087_226589_226674_226722_227117_227592_227614_227864_227932_228374_228535_228650_228668_228978_229060_229155_229286_229363_229526_229691_229867_230020; BDORZ=FFFB88E999055A3F8A630C64834BD6D0; BAIDUID_BFESS=6504A43EB0274812F809031B8671878C:FG=1; B64_BOT=1; BDRCVFR[C5g0hgaJYCf]=bvBYpeu9K4bTAR3Qh4-I0; delPer=0; PSINO=3; BA_HECTOR=al8h2h852ka584a4agak0ggo1hj2sn519; ZFY=ieqEe:Ai8741EeaFdWPdP8JYsVLPfdZb2pa5AnSzsKW8:C; channel=bd.pe8.net; COOKIE_SESSION=2832_0_3_3_8_8_0_0_3_3_0_1_2833_0_54_0_1664186476_0_1664186530%7C9%23114260_19_1663339171%7C6; baikeVisitId=9b4f3a04-d583-4052-9723-8095c345a108; BD_CK_SAM=1; sugstore=1; H_PS_645EC=f709ExtDBjjkFE38TE3k8%2B41MnOFC0dMOW6Pc5%2BTWxSUTxI8HeJCOlKpHClk30Xoq46OZjUQVWvG; BDRCVFR[C0p6oIjvx-c]=sycO_VPkq2bfjf4njRdn1DLg1nkgv99; H_PS_PSSID=37378_36548_36460_37354_37495_36885_37486_37396_36786_37447_37371; BDSVRTM=39"],"header-value":["Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/106.0.0.0 Safari/537.36"],"request-body":"","follow-redirect":"1","tls-validate":"1","cookie-auto-set":"1","repeat-enable":"0","shape":"request"}
- </JsonProperty>
- </mxCell>
<!-- Variable vertex, labelled 定义变量 ("define variable"). Reached from request cell 5 via
     edge 371; edge 399 leads on to loop cell 398.
     Defines one variable, datalist, as resp.selectors('#content_left > div').
     NOTE(review): resp is not defined anywhere in this file; presumably the response of
     request cell 5. Confirm. -->
- <mxCell id="369" value="定义变量" style="variable" parent="1" vertex="1">
- <mxGeometry x="510" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"定义变量","loopVariableName":"","ziloopVariableName":"","variable-name":["datalist"],"variable-description":[""],"loopCount":"","ziloopCount":"","variable-value":["${resp.selectors('#content_left > div')}"],"shape":"variable"}
- </JsonProperty>
- </mxCell>
<!-- Edge 371: request cell 5 to variable cell 369.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="371" value="" style="strokeWidth=2;sharp=1;" parent="1" source="5" target="369" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
<!-- Variable vertex, labelled 定义变量 ("define variable"). Reached from start cell 2 via
     edge 393; edge 394 leads on to request cell 5.
     Defines three variables, in this order:
       keyword    = the literal "北京" ("Beijing")
       page       = value of pageNoData
       startIndex = empty string when page equals '0', otherwise page minus 1
     Request cell 5 appends a literal "0" to startIndex to form the pn query parameter.
     NOTE(review): pageNoData is not defined anywhere in this file; presumably it is supplied
     by whoever launches the flow. Verify against the caller. -->
- <mxCell id="392" value="定义变量" style="variable" parent="1" vertex="1">
- <mxGeometry x="220" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"定义变量","loopVariableName":"","ziloopVariableName":"","variable-name":["keyword","page","startIndex"],"variable-description":["","",""],"loopCount":"","ziloopCount":"","variable-value":["北京","${pageNoData}","${page=='0'?'':(page-1)}"],"shape":"variable"}
- </JsonProperty>
- </mxCell>
<!-- Edge 393: start cell 2 to variable cell 392.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="393" value="" style="strokeWidth=2;sharp=1;" parent="1" source="2" target="392" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
<!-- Edge 394: variable cell 392 to request cell 5.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="394" value="" style="strokeWidth=2;sharp=1;" parent="1" source="392" target="5" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
<!-- Loop vertex, labelled 循环 ("loop"). Reached from variable cell 369 via edge 399;
     edge 402 leads on to variable cell 400.
     loopVariableName is "i" and loopCount is datalist.size() (datalist comes from cell 369);
     loopStart is "0", loopEnd is "-1", awaitSleep is "0", loopItem is empty.
     NOTE(review): the meaning of loopEnd "-1" is not visible in this file; presumably
     "no explicit end index". Confirm against the engine. -->
- <mxCell id="398" value="循环" style="loop" parent="1" vertex="1">
- <mxGeometry x="620" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"循环","loopItem":"","loopVariableName":"i","loopCount":"${datalist.size()}","loopStart":"0","loopEnd":"-1","awaitSleep":"0","shape":"loop"}
- </JsonProperty>
- </mxCell>
<!-- Edge 399: variable cell 369 to loop cell 398.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="399" value="" style="strokeWidth=2;sharp=1;" parent="1" source="369" target="398" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
<!-- Variable vertex, labelled 定义变量 ("define variable"). Reached from loop cell 398 via
     edge 402; edge 405 leads on to output cell 404.
     Defines five variables from datalist.get(i), where i is the loop variable of cell 398:
       title        = text of   '.c-container > div > h3 > a'
       url          = href of   '.c-container > div > h3 > a'
       source       = the constant "小红书" ("Xiaohongshu")
       publish_time = text of   '.c-color-gray2'
       abstract     = text of   '.content-right_8Zs40'
     NOTE(review): '.content-right_8Zs40' looks like a generated class name and may change
     on the target page. Verify before relying on it. -->
- <mxCell id="400" value="定义变量" style="variable" parent="1" vertex="1">
- <mxGeometry x="750" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"定义变量","loopVariableName":"","ziloopVariableName":"","variable-name":["title","url","source","publish_time","abstract"],"variable-description":["","","","",""],"loopCount":"","ziloopCount":"","variable-value":["${datalist.get(i).selector('.c-container > div > h3 > a').text()}","${datalist.get(i).selector('.c-container > div > h3 > a').attr('href')}","${\"小红书\"}","${datalist.get(i).selector('.c-color-gray2').text()}","${datalist.get(i).selector('.content-right_8Zs40').text()}"],"shape":"variable"}
- </JsonProperty>
- </mxCell>
<!-- Edge 402: loop cell 398 to variable cell 400.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="402" value="" style="strokeWidth=2;sharp=1;" parent="1" source="398" target="400" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
<!-- Output vertex, labelled 输出 ("output"). Reached from variable cell 400 via edge 405.
     Emits six fields: title, url, source, publish_time, abstract, author.
       title / abstract: when the value contains keyword, every occurrence of keyword is
                         wrapped in a bold tag with class "key" and style "color:red";
                         otherwise the value is emitted unchanged.
       url, source, publish_time: passed through from cell 400.
       author: the constant '-'.
     output-all, output-database and output-csv are all "0"; tableName and csvName are empty;
     csvEncoding is "GBK".
     NOTE(review): the expressions embed literal bold-tag markup in element text. In
     well-formed XML a literal less-than sign in text must be written as &lt;. Confirm how
     this file is parsed before changing it. -->
- <mxCell id="404" value="输出" style="output" parent="1" vertex="1">
- <mxGeometry x="860" y="122" width="32" height="32" as="geometry"/>
- <JsonProperty as="data">
- {"value":"输出","loopVariableName":"","tableName":"","csvName":"","csvEncoding":"GBK","output-name":["title","url","source","publish_time","abstract","author"],"loopCount":"","output-value":["${strUtils.contains(title,keyword)?(strUtils.replaceAll(title,keyword,'<b class=\"key\" style=\"color:red\">'+keyword+'</b>')):(title)}","${url}","${source}","${publish_time}","${strUtils.contains(abstract,keyword)?(strUtils.replaceAll(abstract,keyword,'<b class=\"key\" style=\"color:red\">'+keyword+'</b>')):(abstract)}","${'-'}"],"output-all":"0","output-database":"0","output-csv":"0","shape":"output"}
- </JsonProperty>
- </mxCell>
<!-- Edge 405: variable cell 400 to output cell 404.
     Empty condition, exception-flow "0", transmit-variable "1". -->
- <mxCell id="405" value="" style="strokeWidth=2;sharp=1;" parent="1" source="400" target="404" edge="1">
- <mxGeometry relative="1" as="geometry"/>
- <JsonProperty as="data">
- {"value":"","exception-flow":"0","lineWidth":"2","line-style":"sharp","lineColor":"black","condition":"","transmit-variable":"1"}
- </JsonProperty>
- </mxCell>
- </root>
- </mxGraphModel>
|