Moteur de recherche en Java

Question

Bonjour à tous, je souhaiterais créer un robot qui parcourra récursivement, sur N niveaux, une liste d’URL donnée à l'initialisation du programme. Merci d'avance et bon courage ! Voici mon code : package genie; import java.io.IOException; import java.io.InputStreamReader; import java.io.Reader; import java.net.URL; import java.net.URLConnection; import java.util.ArrayList; import java.util.HashMap; import java.util.Iterator; import java.util.StringTokenizer; import javax.swing.text.BadLocationException; import javax.swing.text.EditorKit; import javax.swing.text.SimpleAttributeSet; import javax.swing.text.html.HTML; import javax.swing.text.html.HTMLDocument; import javax.swing.text.html.HTMLEditorKit; /** * */ public class robot { @SuppressWarnings("unchecked") public HashMap Index ; @SuppressWarnings("unchecked") public robot () { Index = new HashMap (); } @SuppressWarnings("unchecked") public HashMap indexer(String adresse,int niveau) throws IOException, BadLocationException{ int cpt =0; //Charger la page en fonction de l'url URL url = new URL(adresse); URLConnection uconnection = url.openConnection(); Reader rd = new InputStreamReader(uconnection.getInputStream()); //lire le document HTML EditorKit kit = new HTMLEditorKit(); HTMLDocument doc = (HTMLDocument) kit.createDefaultDocument(); doc.putProperty("IgnoreCharsetDirective", new Boolean(true)); kit.read(rd, doc, 0); //Parcourir la balise lien HTMLDocument.Iterator it = doc.getIterator(HTML.Tag.A); while (it.isValid()) { SimpleAttributeSet s = (SimpleAttributeSet) it.getAttributes(); String link = (String) s.getAttribute(HTML.Attribute.HREF); if (link != null && link.startsWith("http") /*&& link.endsWith(".html")*/) { String titre=(String) s.getAttribute(HTML.Attribute.TITLE); //découpage des mots du titre du lien pour stockage dans le arraylist if(titre!=null){ StringTokenizer st = new StringTokenizer (titre," "); ArrayList tmp = new ArrayList () ; while (st.hasMoreTokens()){ String str=st.nextToken(); 
if(str.length()>2) tmp.add(str); } Index.put(link, tmp); } if(cpt<=niveau){ cpt++; indexer(link,niveau); } } it.next(); } return Index; } @SuppressWarnings("unchecked") public String rechercher (String recherche){ Iterator it = Index.keySet().iterator(); String adresse=""; ArrayList tmp = new ArrayList (); StringTokenizer st = new StringTokenizer (recherche," "); ArrayList mots = new ArrayList (); while(st.hasMoreTokens()){ String str=st.nextToken(); mots.add(str); } while (it.hasNext()){ String current = it.next(); tmp=Index.get(current); for(int i=0;i

cs_Julien39 · Answer

Quelle est ta question ?

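Remarque : les @SuppressWarnings("unchecked") ne sont pas justifiés ici ; tu ferais mieux de régler le problème à la source, en typant tes collections avec des génériques plutôt qu'en masquant les avertissements.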

billouxs · Answer

Désolé si je n'étais pas clair. En fait, j'ai créé ce robot-là et je souhaiterais qu'il parcoure récursivement, sur N niveaux, une liste d'URL ! Genre le nombre de pages que doit parcourir mon moteur de recherche ! J'espère que j'ai été plus clair. Merci ! package genie; import java.io.IOException; import java.io.InputStreamReader; import java.io.Reader; import java.net.URL; import java.net.URLConnection; import java.util.ArrayList; import java.util.HashMap; import java.util.Iterator; import java.util.StringTokenizer; import javax.swing.text.BadLocationException; import javax.swing.text.EditorKit; import javax.swing.text.SimpleAttributeSet; import javax.swing.text.html.HTML; import javax.swing.text.html.HTMLDocument; import javax.swing.text.html.HTMLEditorKit; /** * */ public class robot { public HashMap Index ; public robot () { Index = new HashMap (); } public HashMap indexer(String adresse,int niveau) throws IOException, BadLocationException{ int cpt =0; //Charger la page en fonction de l'url URL url = new URL(adresse); URLConnection uconnection = url.openConnection(); Reader rd = new InputStreamReader(uconnection.getInputStream()); //lire le document HTML EditorKit kit = new HTMLEditorKit(); HTMLDocument doc = (HTMLDocument) kit.createDefaultDocument(); doc.putProperty("IgnoreCharsetDirective", new Boolean(true)); kit.read(rd, doc, 0); //Parcourir la balise lien HTMLDocument.Iterator it = doc.getIterator(HTML.Tag.A); while (it.isValid()) { SimpleAttributeSet s = (SimpleAttributeSet) it.getAttributes(); String link = (String) s.getAttribute(HTML.Attribute.HREF); if (link != null && link.startsWith("http") /*&& link.endsWith(".html")*/) { String titre=(String) s.getAttribute(HTML.Attribute.TITLE); //découpage des mots du titre du lien pour stockage dans le arraylist if(titre!=null){ StringTokenizer st = new StringTokenizer (titre," "); ArrayList tmp = new ArrayList () ; while (st.hasMoreTokens()){ String str=st.nextToken(); if(str.length()>2) tmp.add(str); } 
Index.put(link, tmp); } if(cpt<=niveau){ cpt++; indexer(link,niveau); } } it.next(); } return Index; } public String rechercher (String recherche){ Iterator it = Index.keySet().iterator(); String adresse=""; ArrayList tmp = new ArrayList (); StringTokenizer st = new StringTokenizer (recherche," "); ArrayList mots = new ArrayList (); while(st.hasMoreTokens()){ String str=st.nextToken(); mots.add(str); } while (it.hasNext()){ String current = it.next(); tmp=Index.get(current); for(int i=0;i

Moteur de recherche en Java

2 réponses

Votre réponse

Discussions similaires