www.webdeveloper.com
Results 1 to 3 of 3

Thread: how to extract images from web page given a URL?

  1. #1
    Join Date
    May 2012
    Posts
    1

    how to extract images from web page given a URL?

    I would like to submit a URL and extract the images from the submitted web page. How can I do this using JavaScript? If anyone knows, could you please write a basic script that I can understand?


    Thanks,

    Marcelo
    Rio - Brazil

  2. #2
    Join Date
    Jul 2008
    Location
    urbana, il
    Posts
    2,787
    it's easy with yql:


    Code:
    /**
     * Injects a <script> element that loads the given URL (used below for JSONP).
     *
     * @param {string} u - URL of the script to load.
     * @returns {Element} The script element that was appended.
     */
    function addScript(u){
      var sc2 = document.createElement('script');
      sc2.src = u;
      // Look up <head> explicitly instead of taking getElementsByTagName('*')[1]:
      // the second node of the document is not guaranteed to be <head>.
      // Fall back to the root element when the document has no <head>.
      var host = document.getElementsByTagName('head')[0] || document.documentElement;
      return host.appendChild(sc2);
    }
    
    
    
    /**
     * Requests every <img> element of a page through the YQL public endpoint
     * using JSONP: builds the query URL and injects it with addScript().
     *
     * @param {string} url - Address of the page whose images are wanted.
     * @param {(Function|string)} [cb] - Global callback, given either as a named
     *   function or as the name itself. Defaults to "console.log".
     * @returns {*} Whatever addScript() returns for the built query URL.
     */
    function grabImgs(url, cb){
      // JSONP needs the callback's *name*. Function.name is empty for anonymous
      // functions and missing in some older browsers; in that case recover the
      // name from the function's source text instead of appending the whole
      // function body to the URL.
      var cbName = cb && cb.name;
      if (!cbName) {
        if (typeof cb == 'function') {
          var named = /^\s*function\s+([^\s(]+)/.exec(String(cb));
          cbName = named && named[1];
        } else {
          cbName = cb;
        }
      }

      var query = "http://query.yahooapis.com/v1/public/yql?q=select%20*%20from%20html%20where%20url%3D%22"+
        encodeURIComponent(url)+
        "%22%20and%0A%20%20%20%20%20%20xpath%3D'%2F%2Fimg'&format=json&callback="+
        (cbName || "console.log");

      return addScript(query);
    }
    
    /**
     * JSONP callback: shows the img entries of a YQL response in an alert box,
     * serialized as tab-indented JSON.
     *
     * @param {Object} data - Response object; data.query.results.img is read.
     */
    function myCB(data){
      var images = data.query.results.img;
      var pretty = JSON.stringify(images, null, "\t");
      alert(pretty);
    }
    
    // Demo: request the <img> elements of a forum thread page; the JSONP response is handed to myCB.
    grabImgs("http://www.webdeveloper.com/forum/showthread.php?t=260425", myCB)
    Last edited by rnd me; 05-11-2012 at 12:16 AM.
    Create, Share, and Debug HTML pages and snippets with a cool new web app I helped create: pagedemos.com

  3. #3
    Join Date
    Oct 2006
    Posts
    939
    I guess I can understand that, but my interpretation doesn't work with IE:
    HTML Code:
    <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"
    	"http://www.w3.org/TR/html4/strict.dtd">
    <HTML>
    <HEAD><TITLE>Sa12-17pm37</TITLE>
    <META http-equiv=Content-Type content="text/html; charset=UTF-8">
    <STYLE type=text/CSS>
    
    </STYLE>
    <SCRIPT type="text/javascript">
    
    </SCRIPT>
    <META content="MSHTML 6.00.2900.2963" name=GENERATOR></HEAD>
    <BODY>
    <div>
    <SCRIPT type="text/javascript">
    // Names of the imgur sub-galleries offered as clickable links.
    var pcs='cute,Pictures,topwalls,wallpapers,wallpaper,creepy,EarthPorn,photos,pics,mfw,gif,gifs,reactiongifs'.split(',');

    // Common prefix of every gallery URL.
    var po='http://imgur.com/r/';

    // Write one clickable <span> per gallery. Clicking it loads that gallery's
    // images through grabImgs()/myCB and marks the link pink.
    // The loop counter is declared explicitly so it is no longer an implicit global.
    for(var i=0;i<pcs.length;i++){
      document.write('<span onclick="grabImgs(\''+po+pcs[i]+'\',myCB);this.style.backgroundColor=\'pink\'" style="color:blue;cursor:pointer">'+pcs[i]+'</span> ');
    }
    </SCRIPT>
    </div><div id="pics" style="text-align:center;min-height:500px"></div>
    <SCRIPT type="text/javascript">
    // Base URL of the imgur gallery pages.
    // NOTE(review): nothing in the visible script reads imgu — confirm it is unused before removing.
    var imgu='http://imgur.com/r/'
    /**
     * Appends a <script> element pointing at the given URL so the browser
     * fetches and runs it (JSONP transport for grabImgs).
     *
     * @param {string} u - URL of the script to load.
     * @returns {Element} The appended script element.
     */
    function addScript(u){
      var scriptEl = document.createElement('script');
      scriptEl.src = u;
      // getElementsByTagName('*')[1] only happens to be <head> when the second
      // node of the document is <head>; ask for <head> by name and fall back to
      // the root element so the insertion point does not depend on node order.
      var parent = document.getElementsByTagName('head')[0] || document.documentElement;
      return parent.appendChild(scriptEl);
    }
    
    /**
     * Empties the #pics container, then requests every <img> element of the
     * given page from the YQL public endpoint via JSONP (see addScript).
     *
     * @param {string} url - Address of the page whose images are wanted.
     * @param {(Function|string)} [cb] - Global callback, as a named function or
     *   as its name. Defaults to "console.log".
     * @returns {*} Whatever addScript() returns for the built query URL.
     */
    function grabImgs(url, cb){
      // Remove the thumbnails left over from the previous request.
      var pics = document.getElementById('pics');
      while (pics.hasChildNodes()) {
        pics.removeChild(pics.childNodes[0]);
      }

      // JSONP needs the callback's *name*. Browsers without Function.name
      // (older Internet Explorer) would otherwise get the whole function source
      // appended to the URL, so recover the name from the source text.
      var cbName = cb && cb.name;
      if (!cbName) {
        if (typeof cb == 'function') {
          var named = /^\s*function\s+([^\s(]+)/.exec(String(cb));
          cbName = named && named[1];
        } else {
          cbName = cb;
        }
      }

      var query = "http://query.yahooapis.com/v1/public/yql?q=select%20*%20from%20html%20where%20url%3D%22"+
        encodeURIComponent(url)+
        "%22%20and%0A%20%20%20%20%20%20xpath%3D'%2F%2Fimg'&format=json&callback="+
        (cbName || "console.log");
      return addScript(query);
    }
    
    /**
     * JSONP callback: renders the thumbnails found in a YQL response into #pics.
     *
     * Only images whose src has the letter 'b' immediately before the final
     * four characters (e.g. "...b.jpg") are shown — presumably imgur's
     * thumbnail size suffix; confirm against imgur's URL scheme. Clicking a
     * thumbnail calls seeBig() with the src minus its last five characters.
     *
     * A response with no results, or with a single img object instead of an
     * array, is handled; with nothing to show the container is simply emptied.
     *
     * @param {Object} data - YQL response; data.query.results.img is read.
     */
    function myCB(data){
      var THUMB_STYLE = 'cursor:pointer;margin-top:0px;margin-left:0px;margin-bottom: 0px;margin-right: 1px';

      // Escape text for use inside a double-quoted HTML attribute; the src
      // values come from a remote page and must not be able to break out.
      function escAttr(text){
        return String(text)
          .replace(/&/g, '&amp;')
          .replace(/"/g, '&quot;')
          .replace(/</g, '&lt;')
          .replace(/>/g, '&gt;');
      }

      var results = data && data.query && data.query.results;
      var found = results && results.img;
      var imgs;
      if (!found) {
        imgs = [];
      } else if (Object.prototype.toString.call(found) == '[object Array]') {
        imgs = found;
      } else {
        imgs = [found]; // a lone match is not wrapped in an array
      }

      var html = [];
      for (var idx = 0; idx < imgs.length; idx++) {
        var src = imgs[idx] && imgs[idx].src;
        if (typeof src != 'string') { continue; }

        var sizeCode = src.substring(src.length-5, src.length-4);
        if (sizeCode != 'b') { continue; }

        // The full-size address is the thumbnail address without "b.ext".
        var big = src.substring(0, src.length-5);
        // Escape for the single-quoted JS string first, then for the attribute.
        var bigJs = big.replace(/\\/g, '\\\\').replace(/'/g, "\\'");

        html.push('<img src="'+escAttr(src)+'" title="'+sizeCode+'" onclick="seeBig(\''+escAttr(bigJs)+'\')" style="'+THUMB_STYLE+'">');
      }
      document.getElementById('pics').innerHTML = html.join('');
    }
    /**
     * Opens the full-size version of a thumbnail in a new window.
     *
     * @param {string} d - Image address without its extension; '.jpg' is appended.
     */
    function seeBig(d){
      // Math.random() stringifies with a '.', which is not a safe window name:
      // older Internet Explorer versions are reported to reject names containing
      // anything but letters, digits and underscores. Keep only the digits so
      // each call still gets its own (new) window.
      var winName = 'aWin' + String(Math.random()).replace(/\D/g, '');
      window.open(d+'.jpg', winName, '');
    }
    
    </SCRIPT>
    
    </BODY></HTML>

Thread Information

Users Browsing this Thread

There is currently 1 user browsing this thread. (0 members and 1 guest)

Posting Permissions

  • You may not post new threads
  • You may not post replies
  • You may not post attachments
  • You may not edit your posts
  •  
HTML5 Development Center

"

"

X vBulletin 4.2.2 Debug Information

  • Page Generation 0.25368 seconds
  • Memory Usage 2,868KB
  • Queries Executed 15 (?)
More Information
Template Usage (34):
  • (1)SHOWTHREAD
  • (1)ad_footer_end
  • (1)ad_footer_start
  • (1)ad_global_above_footer
  • (1)ad_global_below_navbar
  • (1)ad_global_header1
  • (1)ad_global_header2
  • (1)ad_navbar_below
  • (1)ad_showthread_firstpost_sig
  • (1)ad_showthread_firstpost_start
  • (1)ad_thread_first_post_content
  • (1)ad_thread_last_post_content
  • (1)bbcode_code
  • (1)bbcode_html
  • (1)footer
  • (1)forumjump
  • (1)forumrules
  • (1)gobutton
  • (1)header
  • (1)headinclude
  • (1)headinclude_bottom
  • (3)memberaction_dropdown
  • (1)navbar
  • (4)navbar_link
  • (1)navbar_moderation
  • (1)navbar_noticebit
  • (1)navbar_tabs
  • (2)option
  • (3)postbit
  • (3)postbit_onlinestatus
  • (3)postbit_wrapper
  • (1)spacer_close
  • (1)spacer_open
  • (1)tagbit_wrapper 

Phrase Groups Available (6):
  • global
  • inlinemod
  • postbit
  • posting
  • reputationlevel
  • showthread
Included Files (26):
  • ./showthread.php
  • ./global.php
  • ./includes/class_bootstrap.php
  • ./includes/init.php
  • ./includes/class_core.php
  • ./includes/config.php
  • ./includes/functions.php
  • ./includes/functions_navigation.php
  • ./includes/class_friendly_url.php
  • ./includes/class_hook.php
  • ./includes/class_bootstrap_framework.php
  • ./vb/vb.php
  • ./vb/phrase.php
  • ./includes/functions_facebook.php
  • ./includes/functions_calendar.php
  • ./includes/functions_bigthree.php
  • ./includes/class_postbit.php
  • ./includes/class_bbcode.php
  • ./includes/functions_reputation.php
  • ./includes/functions_notice.php
  • ./packages/vbattach/attach.php
  • ./vb/types.php
  • ./vb/cache.php
  • ./vb/cache/db.php
  • ./vb/cache/observer/db.php
  • ./vb/cache/observer.php 

Hooks Called (72):
  • init_startup
  • friendlyurl_resolve_class
  • init_startup_session_setup_start
  • database_pre_fetch_array
  • database_post_fetch_array
  • init_startup_session_setup_complete
  • global_bootstrap_init_start
  • global_bootstrap_init_complete
  • cache_permissions
  • fetch_postinfo_query
  • fetch_postinfo
  • fetch_threadinfo_query
  • fetch_threadinfo
  • fetch_foruminfo
  • load_show_variables
  • load_forum_show_variables
  • global_state_check
  • global_bootstrap_complete
  • global_start
  • style_fetch
  • global_setup_complete
  • showthread_start
  • showthread_getinfo
  • strip_bbcode
  • friendlyurl_clean_fragment
  • friendlyurl_geturl
  • forumjump
  • cache_templates
  • cache_templates_process
  • template_register_var
  • template_render_output
  • fetch_template_start
  • fetch_template_complete
  • parse_templates
  • fetch_musername
  • notices_check_start
  • notices_noticebit
  • process_templates_complete
  • friendlyurl_redirect_canonical
  • showthread_post_start
  • showthread_query_postids
  • showthread_query
  • bbcode_fetch_tags
  • bbcode_create
  • showthread_postbit_create
  • postbit_factory
  • postbit_display_start
  • postbit_imicons
  • bbcode_parse_start
  • bbcode_parse_complete_precache
  • bbcode_parse_complete
  • postbit_display_complete
  • memberaction_dropdown
  • tag_fetchbit_complete
  • forumrules
  • navbits
  • navbits_complete
  • build_navigation_data
  • build_navigation_array
  • check_navigation_permission
  • process_navigation_links_start
  • process_navigation_links_complete
  • set_navigation_menu_element
  • build_navigation_menudata
  • build_navigation_listdata
  • build_navigation_list
  • set_navigation_tab_main
  • set_navigation_tab_fallback
  • navigation_tab_complete
  • fb_like_button
  • showthread_complete
  • page_templates