Index: HTMLParser.java
===================================================================
RCS file: /home/cvspublic/jakarta-lucene/src/demo/org/apache/lucene/demo/html/HTMLParser.java,v
retrieving revision 1.4
diff -u -r1.4 HTMLParser.java
--- HTMLParser.java 23 Nov 2003 18:37:32 -0000 1.4
+++ HTMLParser.java 2 Apr 2004 21:02:10 -0000
@@ -10,7 +10,8 @@
StringBuffer title = new StringBuffer(SUMMARY_LENGTH);
StringBuffer summary = new StringBuffer(SUMMARY_LENGTH * 2);
Properties metaTags=new Properties();
- String currentMetaTag="";
+ String currentMetaTag=null;
+ String currentMetaContent=null;
int length = 0;
boolean titleComplete = false;
boolean inTitle = false;
@@ -122,8 +123,10 @@
return;
if (inMetaTag)
{
- metaTags.setProperty(currentMetaTag, text);
- return;
+ metaTags.setProperty(currentMetaTag, currentMetaContent);
+ currentMetaTag = null;
+ currentMetaContent = null;
+ return;
}
if (inTitle)
title.append(text);
@@ -262,11 +265,17 @@
&& t2 != null)
{
currentMetaTag=t2.image.toLowerCase();
+ if(currentMetaTag != null && currentMetaContent != null) {
+ addText(t2.image);
+ }
}
if(inMetaTag && t1.image.equalsIgnoreCase("content") && t2 !=
null)
{
+ currentMetaContent=t2.image.toLowerCase();
+ if(currentMetaTag != null && currentMetaContent != null) {
addText(t2.image);
+ }
}
break;
default:
@@ -441,15 +450,15 @@
finally { jj_save(1, xla); }
}
- final private boolean jj_3_2() {
- if (jj_scan_token(ArgQuote2)) return true;
- if (jj_scan_token(CloseQuote2)) return true;
- return false;
- }
-
final private boolean jj_3_1() {
if (jj_scan_token(ArgQuote1)) return true;
if (jj_scan_token(CloseQuote1)) return true;
+ return false;
+ }
+
+ final private boolean jj_3_2() {
+ if (jj_scan_token(ArgQuote2)) return true;
+ if (jj_scan_token(CloseQuote2)) return true;
return false;
}