Voici le code JAVA :
-------------------------------------------
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.InputStream;
import java.net.HttpURLConnection;
import java.net.URL;
public class TestCarac {
private String[] caracteres = {"\"", "<", ">", "¡", "¢", "£", "¤", "¥", "¦", "§", "¨", "©", "ª", "«", "¬", "", "®", "¯", "°", "±", "²", "³", "´", "µ", "¶", "·", "¸", "¹", "º", "»", "¼", "½", "¾", "¿", "À", "Á", "Â", "Ã", "Ä", "Å", "Æ", "Ç", "È", "É", "Ê", "Ë", "Ì", "Í", "Î", "Ï", "Ð", "Ñ", "Ò", "Ó", "Ô", "Õ", "Ö", "×", "Ø", "Ù", "Ú", "Û", "Ü", "Ý", "ß", "à", "á", "â", "ã", "ä", "å", "æ", "ç", "è", "é", "ê", "ë", "ì", "í", "î", "ï", "ð", "ñ", "ò", "ó", "ô", "õ", "ö", "÷", "ø", "ù", "ú", "û", "ü", "ý", "ÿ", "Œ", "œ", "Ÿ", "ˆ", "˜", "€", "™"};
private String[] entitesHTML = {""", "<", ">", "¡", "¢", "£", "¤", "¥", "¦", "§", "¨", "©", "ª", "«", "¬", "­", "®", "¯", "°", "±", "²", "³", "´", "µ", "¶", "·", "¸", "¹", "º", "»", "¼", "½", "¾", "¿", "À", "Á", "Â", "Ã", "Ä", "Å", "Æ", "Ç", "È", "É", "Ê", "Ë", "Ì", "Í", "Î", "Ï", "Ð", "Ñ", "Ò", "Ó", "Ô", "Õ", "Ö", "×", "Ø", "Ù", "Ú", "Û", "Ü", "Ý", "ß", "à", "á", "â", "ã", "ä", "å", "æ", "ç", "è", "é", "ê", "ë", "ì", "í", "î", "ï", "ð", "ñ", "ò", "ó", "ô", "õ", "ö", "÷", "ø", "ù", "ú", "û", "ü", "ý", "ÿ", "Œ", "œ", "Ÿ", "ˆ", "˜", "€", "™"};
public TestCarac() {
testHTML();
}
public void testHTML(){
System.out.println("Test HTML : ");
System.out.println("Récupération du code HTML...");
String source = recupHTML();
if (source.indexOf("acidulé") != -1){
System.out.println(" * mot acidulé trouvé dans le source\n");
}
else {
System.out.println(" * mot acidulé non trouvé dans le source\n");
}
if (source.indexOf("maraîcher") != -1){
System.out.println(" * mot maraîcher trouvé dans le source\n");
}
else {
System.out.println(" * mot maraîcher non trouvé dans le source\n");
}
try{
System.out.println("Ecriture du source dans fichier.");
BufferedWriter file = new BufferedWriter(new FileWriter("testHTML.txt"));
file.write(source);
file.newLine();
file.newLine();
file.flush();
System.out.println("Ecriture du source encodé dans fichier.");
file.write(encoder(source));
file.flush();
file.close();
}catch(Exception e) {
System.out.println(e.getMessage() + "\nErreur d'écriture du fichier testHTML.txt");
}
try {
System.out.println("Lecture du source depuis le fichier.");
BufferedReader br = new BufferedReader(new FileReader("testHTML.txt"));
String chaine="", ligne;
while ((ligne = br.readLine()) != null) {
chaine += ligne;
}
if (chaine.indexOf("acidulé") != -1){
System.out.println(" * mot acidulé trouvé dans le source\n");
}
else {
System.out.println(" * mot acidulé non trouvé dans le source\n");
}
if (chaine.indexOf("maraîcher") != -1){
System.out.println(" * mot maraîcher trouvé dans le source\n");
}
else {
System.out.println(" * mot maraîcher non trouvé dans le source\n");
}
br.close();
}catch (Exception e) {
System.out.println(e.getMessage() + "\nErreur de lecture du fichier testHTML.txt");
}
}
public String recupHTML(){
String source = "";
try {
URL adresse = new URL("[
www.legumes.ch]
;
// Etablissement de la connexion
HttpURLConnection connexion = (HttpURLConnection)adresse.openConnection();
// Récupération du code source
InputStream is = connexion.getInputStream();
int sizeRead;
int sizeAvailable = is.available();
if (sizeAvailable == 0){
sizeAvailable = 7719;
}
byte[] b = new byte[sizeAvailable];
while ((sizeRead = is.read(b)) != -1){
source += new String(b, 0, sizeRead);
b = new byte[sizeAvailable];
}
connexion.disconnect();
}
catch (Exception e) {
System.out.println(e.getMessage() + "\nErreur de récupération de code source.");
}
return source;
}
public String encoder(String chaine){
for (int i=0 ; i<caracteres.length ; i++){
chaine = chaine.replaceAll(caracteres
, entitesHTML);
}
return chaine;
}
public static void main(String[] args) {
new TestCarac();
}
}
-------------------------------------------
et donc aucun des mots recherchés n'est trouvé...
merci