- 论坛徽章:
- 1
|
回复 4# laputa73
还是不行啊,实在是尽力了,继续求帮助
use strict;
use warnings;
use LWP;

# Fetch the PMC image search results for "boolean network", then POST the
# Entrez pager form to request the next page and print every .gif URL found
# in the POST response (one per line, no trailing newline).

my $ua = LWP::UserAgent->new(
    agent      => 'Mozilla/5.0 (compatible; MSIE 10.0; Windows NT 6.2; WOW64; Trident/6.0)',
    cookie_jar => {},    # in-memory jar so the session cookie is replayed on the POST
    max_redirect          => 30,
    requests_redirectable => ['GET', 'POST', 'HEAD'],
);

# First visit, exactly as typed into the browser address bar.
my $url1 = "http://www.ncbi.nlm.nih.gov/pmc/?term=boolean+network&report=imagesdocsum";
# Target of the POST that performs the page jump.
my $url = "http://www.ncbi.nlm.nih.gov/pmc";

# The first response carries the page number, the total gif count and the
# gif URLs of the current page.
my $con = $ua->get($url1);
die "GET $url1 failed: " . $con->status_line . "\n" unless $con->is_success;

# Pull the session id out of the cookie jar. Capture in list context so a
# failed match leaves $sid undefined instead of reusing a stale $1.
my ($sid) = $ua->cookie_jar->as_string =~ /ncbi_sid\=(\w+)/;
warn "ncbi_sid cookie not found in the cookie jar\n" unless defined $sid;

# Form fields sent with the page-change POST.
# NOTE(review): four field names originally carried a trailing space inside
# the quotes (EmailTab.EmailCount, HistoryDisplay.Cmd, Pmc_DisplayBar.FileFormat,
# Pmc_DisplayBar.sPageSize). They are presumably paste artifacts and would be
# sent as different field names, so they are trimmed here -- confirm against
# the field names of the live form.
my $args = {
    'EntrezSystem2.PEntrez.DbConnector.Cmd'                  => 'PageChanged',
    'EntrezSystem2.PEntrez.DbConnector.Db'                   => 'pmc',
    'EntrezSystem2.PEntrez.DbConnector.IdsFromResult'        => '',
    'EntrezSystem2.PEntrez.DbConnector.LastDb'               => 'pmc',
    'EntrezSystem2.PEntrez.DbConnector.LastIdsFromResult'    => '',
    'EntrezSystem2.PEntrez.DbConnector.LastQueryKey'         => 2,
    'EntrezSystem2.PEntrez.DbConnector.LastTabCmd'           => '',
    'EntrezSystem2.PEntrez.DbConnector.LinkName'             => '',
    'EntrezSystem2.PEntrez.DbConnector.LinkReadableName'     => '',
    'EntrezSystem2.PEntrez.DbConnector.LinkSrcDb'            => '',
    'EntrezSystem2.PEntrez.DbConnector.QueryKey'             => '',
    'EntrezSystem2.PEntrez.DbConnector.TabCmd'               => '',
    'EntrezSystem2.PEntrez.DbConnector.Term'                 => 'boolean network',
    'EntrezSystem2.PEntrez.Pmc.Pmc_PageController.PreviousPageName' => 'results',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.Email'            => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailCount'       => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailFormat'      => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailQueryKey'    => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailReport'      => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailSort'        => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailStart'       => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailSubject'     => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.EmailText'        => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.EmailTab.QueryDescription' => '',
    # Presumably "currently on page 1, jump to page 2" -- TODO confirm.
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Entrez_Pager.cPage'    => 1,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Entrez_Pager.CurrPage' => 2,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.HistoryDisplay.Cmd'    => 'PageChanged',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.FileFormat'       => 'imagesdocsum',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.Format'           => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.LastFormat'       => '',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.LastPageSize'     => 20,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.LastPresentation' => 'imagesdocsum',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.PageSize'         => 20,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.Presentation'     => 'imagesdocsum',
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.sPageSize'        => 20,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_DisplayBar.sPageSize2'       => 20,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_ResultsSearchController.ResultCount'  => 400,
    'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Pmc_ResultsSearchController.RunLastQuery' => '',
    # Single quotes are required: "$a", "$l" and "$st" must not interpolate.
    'p$a'  => 'EntrezSystem2.PEntrez.Pmc.Pmc_ResultsPanel.Entrez_Pager.Page',
    'p$l'  => 'EntrezSystem2',
    'p$st' => 'pmc',
    'term' => 'boolean network',
    # 'SessionId' => $sid,
    # 'Snapshot' => '/projects/entrez/Entrez@3.52',
};

my $abc = $ua->post($url, $args);
die "POST $url failed: " . $abc->status_line . "\n" unless $abc->is_success;

# Print the gif URLs of the fetched page.
#print join "\n", @{ geturl($con->content) };    # original page: works
print join "\n", @{ geturl($abc->content) };     # page jump: reported as failing
# geturl($content)
#
# Collect every double-quoted value in $content that ends in ".gif".
#
# Parameters:
#   $content - text to scan (e.g. an HTML page body); may be undef or empty.
#
# Returns:
#   An array reference holding the matched values, without the surrounding
#   quotes, in order of appearance. Empty when nothing matches or when
#   $content is undefined.
sub geturl {
    my $content = shift;
    my @urls;

    # Undefined input (e.g. a response without a body) yields no URLs rather
    # than an "uninitialized value" warning.
    return \@urls unless defined $content;

    # Require the opening quote and refuse whitespace and angle brackets
    # inside the value, so free text or markup that merely precedes a
    # `.gif"` is not swallowed into the capture.
    while ($content =~ /"([^"\s<>]+?\.gif)"/g) {
        push @urls, $1;
    }

    return \@urls;
}
复制代码 |
|